# dlmm_data_collector.py
import requests
import pandas as pd
import numpy as np
import json
import logging
import os
import queue
import random
import sys
import threading
import time
import traceback
import msvcrt  # Windows-only standard-library module
from contextlib import nullcontext
from datetime import datetime, timezone, timedelta
from json import JSONEncoder

from arch import arch_model
from colorama import init, Fore, Back, Style
from dtaidistance import dtw
from pykalman import KalmanFilter
from ratelimit import limits, sleep_and_retry
from requests.exceptions import RequestException
from rich.box import ROUNDED
from rich.console import Console
from rich.live import Live
from rich.logging import RichHandler
from rich.panel import Panel
from rich.progress import Progress, TextColumn, BarColumn, TimeRemainingColumn
from rich.table import Table
from rich.text import Text
from scipy import stats
from sklearn.ensemble import RandomForestRegressor
from sklearn.metrics import mean_squared_error, r2_score
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
data_pull_lock = threading.Lock()

# Initialize colorama
init(autoreset=True)

# Set up the shared rich console and logging
console = Console()
logging.basicConfig(level="INFO", format="%(message)s", datefmt="[%X]",
                    handlers=[RichHandler(rich_tracebacks=True, console=console)])
log = logging.getLogger("rich")
BASE_URL = "https://api.geckoterminal.com/api/v2"
class NumpyEncoder(JSONEncoder):
def default(self, obj):
if isinstance(obj, np.integer):
return int(obj)
elif isinstance(obj, np.floating):
return float(obj)
elif isinstance(obj, np.ndarray):
return obj.tolist()
return JSONEncoder.default(self, obj)
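# Usage sketch (illustrative, not called anywhere): NumpyEncoder lets json.dumps
# handle numpy scalars and arrays that the stock encoder rejects.
def _example_numpy_json():
    payload = {'score': np.float64(91.7), 'volumes': np.array([1, 2, 3])}
    return json.dumps(payload, cls=NumpyEncoder)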
class DataManager:
def __init__(self):
self.df = None
self.last_update = None
def load_data(self):
if self.df is None or (datetime.now() - self.last_update) > timedelta(minutes=30):
console.print("Loading data from CSV file...")
self.df = pd.read_csv('meme_coin_data.csv')
console.print(f"Loaded {len(self.df)} rows of data")
self.df['timestamp'] = pd.to_datetime(self.df['timestamp'], errors='coerce')
invalid_timestamps = self.df['timestamp'].isnull()
if invalid_timestamps.any():
console.print(f"[yellow]Dropped {invalid_timestamps.sum()} rows with invalid timestamps[/yellow]")
self.df = self.df.dropna(subset=['timestamp'])
self.last_update = datetime.now()
console.print("Data loading complete")
def get_recent_data(self):
seven_days_ago = datetime.now(timezone.utc) - timedelta(days=7)
return self.df[self.df['timestamp'] > seven_days_ago]
data_manager = DataManager()
class GlobalState:
def __init__(self):
self.last_pull_time = datetime.now()
global_state = GlobalState()
request_queue = queue.Queue()
RATE_LIMIT = 20  # Calls per minute, set lower than the actual limit for safety
DELAY = 60 / RATE_LIMIT  # Seconds between requests: 60 / 20 = 3.0
def process_queue():
while True:
request = request_queue.get()
if request is None:
break
url, params, callback = request
try:
response = requests.get(url, headers={'accept': 'application/json'}, params=params, timeout=30)
response.raise_for_status()
callback(response.json())
except Exception as e:
log.error(f"Error processing request: {str(e)}")
finally:
request_queue.task_done()
time.sleep(DELAY)
# Start the queue processor thread
queue_thread = threading.Thread(target=process_queue, daemon=True)
queue_thread.start()
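# Usage sketch (illustrative, not part of the collection flow): how a caller
# would hand a request to the rate-limited worker above. The callback here
# only logs the payload size; real callers would parse and store the response.
def _example_enqueue_trending(network="solana"):
    def _on_response(payload):
        log.info(f"Received {len(payload.get('data', []))} trending pools for {network}")
    request_queue.put((f"{BASE_URL}/networks/{network}/trending_pools", {'page': 1}, _on_response))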
@sleep_and_retry
@limits(calls=20, period=60)
def call_api_with_retry(url, params=None, max_retries=5):
    for attempt in range(max_retries):
        try:
            response = requests.get(url, headers={'accept': 'application/json'}, params=params, timeout=30)
            response.raise_for_status()
            return response.json()
        except RequestException as e:
            # e.response is None for connection-level failures (timeouts, DNS
            # errors); retry those with backoff too, rather than crashing on a
            # status_code lookup against an unbound response.
            status_code = e.response.status_code if e.response is not None else None
            if status_code is None or status_code == 429 or (500 <= status_code < 600):
                sleep_time = min(30, (2 ** attempt) + random.uniform(0, 1))
                log.warning(f"Rate limit, server error, or connection failure. Retrying in {sleep_time:.2f} seconds...")
                time.sleep(sleep_time)
            elif status_code == 400:
                log.error(f"Bad request for URL: {url}")
                return None
            else:
                raise
    raise Exception("Max retries reached")
def get_trending_pools(network='solana', page=1):
url = f"{BASE_URL}/networks/{network}/trending_pools"
return call_api_with_retry(url, params={'page': page})
def get_pool_info(network, pool_address):
url = f"{BASE_URL}/networks/{network}/pools/{pool_address}"
return call_api_with_retry(url, params={'include': 'base_token'})
def get_ohlcv_data(network, pool_address):
ohlcv_data = {}
timeframes = [
('day', 1, 30), ('hour', 4, 42), ('hour', 1, 24)
]
for timeframe, aggregate, limit in timeframes:
url = f"{BASE_URL}/networks/{network}/pools/{pool_address}/ohlcv/{timeframe}"
params = {'aggregate': aggregate, 'limit': limit, 'currency': 'usd', 'token': 'base'}
try:
response = call_api_with_retry(url, params)
ohlcv_data[timeframe] = response
time.sleep(2) # Add a 2-second delay between API calls
except Exception as e:
log.error(f"Failed to get OHLCV data for {pool_address} ({timeframe}): {str(e)}")
return ohlcv_data
def calculate_ohlcv_metrics(ohlcv_data):
metrics = {}
for timeframe, data in ohlcv_data.items():
if 'data' not in data or 'attributes' not in data['data'] or 'ohlcv_list' not in data['data']['attributes']:
continue
ohlcv_list = data['data']['attributes']['ohlcv_list']
if not ohlcv_list:
continue
        closes = [item[4] for item in ohlcv_list]
        volumes = [item[5] for item in ohlcv_list]
        avg_volume = np.mean(volumes)
        # Log-return volatility; guard against zero prices that would blow up the log
        closes_arr = np.array(closes, dtype=float)
        with np.errstate(divide='ignore', invalid='ignore'):
            log_returns = np.log(closes_arr[1:] / closes_arr[:-1])
        log_returns = log_returns[np.isfinite(log_returns)]
        volatility = np.std(log_returns) if len(log_returns) > 0 else 0.0
        period = '30d' if timeframe == 'day' else '7d' if timeframe == 'hour' and len(ohlcv_list) > 24 else '24h'
metrics.update({
f'avg_{timeframe}_volume': avg_volume,
f'{period}_volatility': volatility,
f'price_{period}_ago': closes[-1] if closes else None,
f'price_change_{period}': ((closes[0] / closes[-1]) - 1) * 100 if len(closes) > 1 else None
})
return metrics
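# Minimal worked example of the log-return volatility used above, on toy closes
# (values illustrative only): take ln(p_t / p_{t-1}) for each step, then the
# standard deviation of those returns.
def _example_log_return_volatility(closes=(1.00, 1.05, 0.98, 1.02)):
    closes_arr = np.array(closes, dtype=float)
    return float(np.std(np.log(closes_arr[1:] / closes_arr[:-1])))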
def collect_data():
    # Scoring weights shown to the user; kept in sync with multifactor_score() below
    weights = {
        'price_momentum': 0.25,
        'price_reversion': 0.20,
        'volume_acceleration': 0.30,
        'market_cap': 0.05,
        'volatility': 0.15,
        'liquidity_ratio': 0.05
    }
# Display score interpretation ranges and scoring weights at the beginning
score_ranges = f"""[bold underline]Score Interpretation[/bold underline]
[green]80-100[/green]: Exceptional performance across all factors
[light_green]60-80[/light_green]: Strong performance
[yellow]40-60[/yellow]: Average performance
[orange1]20-40[/orange1]: Below average performance
[red]0-20[/red]: Poor performance
[bold underline]Scoring System Weights[/bold underline]
Price Momentum: {weights['price_momentum'] * 100:.0f}%
Price Reversion: {weights['price_reversion'] * 100:.0f}%
Volume Acceleration: {weights['volume_acceleration'] * 100:.0f}%
Market Cap: {weights['market_cap'] * 100:.0f}%
Volatility: {weights['volatility'] * 100:.0f}%
Liquidity Ratio: {weights['liquidity_ratio'] * 100:.0f}%
[bold yellow]Note:[/bold yellow] Data collection may take up to 8 minutes due to public API rate limits.
The multifactor score evaluates tokens on recent price momentum, potential for price reversals, volume trends, market cap, and volatility. A higher score suggests a token may be entering a phase of increased trading activity and price movement. For LP providers, this can signal an opportunity to earn fees from heightened trading volume while the token's price dynamics remain favorable. Always combine this score with your own research and risk assessment before making LP decisions.
"""
console.print(Panel(score_ranges, style="bold cyan"))
console.print(Panel("Starting data collection...", style="bold green"))
all_data = []
skipped_tokens = []
tokens_for_table = []
# Determine if the current thread is the main thread
is_main_thread = threading.current_thread() == threading.main_thread()
if is_main_thread:
progress_context = Progress(
TextColumn("[progress.description]{task.description}"),
BarColumn(),
TextColumn("[progress.percentage]{task.percentage:>3.0f}%"),
TimeRemainingColumn(),
console=console,
)
else:
# Use a no-op context manager for the background thread
progress_context = nullcontext()
with progress_context as progress:
        # Fetch each page of trending pools once and reuse the response for both
        # the progress total and processing, avoiding duplicate API calls.
        pages_data = []
        for page in [1, 2]:
            try:
                trending_pools = get_trending_pools(network='solana', page=page)
                if not trending_pools or 'data' not in trending_pools:
                    console.print(f"[bold red]Unexpected response structure for page {page}:[/bold red] {trending_pools}")
                    continue
                pages_data.append(trending_pools)
            except Exception as e:
                console.print(f"[bold red]Error fetching trending pools for page {page}:[/bold red] {str(e)}")
                continue
        total_tokens = sum(len(p['data']) for p in pages_data)
        overall_task = progress.add_task("[cyan]Collecting Data", total=total_tokens) if is_main_thread else None
        for trending_pools in pages_data:
            for pool in trending_pools['data']:
                try:
                    pool_attributes = pool.get('attributes', {})
                    token_name = pool_attributes.get('name', 'Unknown')
network = 'solana'
pool_address = pool_attributes.get('address', 'Unknown')
if is_main_thread and progress is not None and overall_task is not None:
progress.update(overall_task, description=f"[cyan]Processing: {token_name}")
else:
console.print(f"Processing: {token_name}")
# Fetch additional pool info and OHLCV data
pool_info = get_pool_info(network, pool_address)
ohlcv_data = get_ohlcv_data(network, pool_address)
metrics = calculate_ohlcv_metrics(ohlcv_data)
current_time = datetime.now(timezone.utc)
pool_created_at_str = pool_attributes.get('pool_created_at', current_time.isoformat())
try:
pool_created_at = datetime.fromisoformat(pool_created_at_str.replace('Z', '+00:00'))
except ValueError:
pool_created_at = current_time
pool_age_hours = (current_time - pool_created_at).total_seconds() / 3600
# Extract necessary data
price_change_percentage = pool_attributes.get('price_change_percentage', {})
volume_usd = pool_attributes.get('volume_usd', {})
transactions = pool_attributes.get('transactions', {})
# Prepare pool_data with all specified fields
pool_data = {
'timestamp': current_time.isoformat(),
'token_name': token_name,
'network': network,
'token_price': float(pool_attributes.get('base_token_price_usd', 0)),
'market_cap': float(pool_attributes.get('market_cap_usd', 0) or 0),
'fdv': float(pool_attributes.get('fdv_usd', 0) or 0),
'liquidity': float(pool_attributes.get('reserve_in_usd', 0) or 0),
'volume_5m': float(volume_usd.get('m5', 0) or 0),
'volume_1h': float(volume_usd.get('h1', 0) or 0),
'volume_6h': float(volume_usd.get('h6', 0) or 0),
'volume_24h': float(volume_usd.get('h24', 0) or 0),
'price_change_5m': float(price_change_percentage.get('m5', 0) or 0),
'price_change_1h': float(price_change_percentage.get('h1', 0) or 0),
'price_change_6h': float(price_change_percentage.get('h6', 0) or 0),
                        'price_change_24h': float(price_change_percentage.get('h24', 0) or 0),
                        # 24h buy/sell counts, consumed later by the ML features;
                        # nested key layout assumed from the transactions object
                        'transactions_24h_buys': int((transactions.get('h24', {}) or {}).get('buys', 0) or 0),
                        'transactions_24h_sells': int((transactions.get('h24', {}) or {}).get('sells', 0) or 0),
                        'pool_created_at': pool_created_at.isoformat(),
                        'pool_age_hours': pool_age_hours,
                    }
# Ensure 'market_cap' has a value
pool_data['market_cap'] = pool_data['market_cap'] or pool_data['fdv']
pool_data['effective_market_cap'] = pool_data['market_cap']
# Add metrics from OHLCV data
pool_data.update(metrics)
# Extract scalar values for multifactor score
price_momentum = float(pool_data['price_change_24h'])
volume_1h = float(pool_data['volume_1h'])
volume_24h = float(pool_data['volume_24h'])
market_cap = float(pool_data['effective_market_cap'])
# Calculate volatility using the existing method in your script
historical_prices = [float(item[4]) for timeframe_data in ohlcv_data.values()
if 'data' in timeframe_data and 'attributes' in timeframe_data['data']
and 'ohlcv_list' in timeframe_data['data']['attributes']
for item in timeframe_data['data']['attributes']['ohlcv_list']]
volatility = np.std(np.diff(np.log(historical_prices))) if len(historical_prices) > 1 else 0.1
liquidity_ratio = volume_24h / market_cap if market_cap > 0 else 0
                    try:
                        mf_score = multifactor_score(
                            price_momentum=price_momentum,
                            volume_1h=volume_1h,
                            volume_24h=volume_24h,
                            market_cap=market_cap,
                            volatility=volatility,
                            liquidity_ratio=liquidity_ratio,
                            ohlcv_metrics=ohlcv_data
                        )
pool_data['multifactor_score'] = mf_score
except Exception as score_error:
console.print(f"[yellow]Error calculating multifactor score for {token_name}: {str(score_error)}[/yellow]")
mf_score = 0
pool_data['multifactor_score'] = mf_score
all_data.append(pool_data)
# Collect data for the table
tokens_for_table.append({
'Token Name': token_name,
'Network': network.upper(),
'Price (USD)': f"${pool_data['token_price']:.6f}",
'Market Cap (USD)': f"${pool_data['market_cap']:,.2f}",
'Volume 24h (USD)': f"${pool_data['volume_24h']:,.2f}",
'Liquidity (USD)': f"${pool_data['liquidity']:,.2f}",
'Change 24h (%)': f"{pool_data['price_change_24h']:.2f}%",
'Score': f"{mf_score:.2f}"
})
if is_main_thread and progress is not None and overall_task is not None:
progress.update(overall_task, advance=1)
else:
pass # Optionally, print minimal progress in the background thread
time.sleep(1) # Add a small delay between processing each pool
except KeyError as e:
skipped_tokens.append(token_name)
console.print(f"[yellow]Skipping token {token_name} due to missing data: {str(e)}[/yellow]")
if is_main_thread and progress is not None and overall_task is not None:
progress.update(overall_task, advance=1)
else:
pass
except Exception as e:
console.print(f"[red]Error processing pool {pool_attributes.get('address', 'Unknown')}: {str(e)}[/red]")
console.print(f"[yellow]Pool attributes: {json.dumps(pool_attributes, indent=2)}[/yellow]")
if is_main_thread and progress is not None and overall_task is not None:
progress.update(overall_task, advance=1)
else:
pass
console.print(Panel("Data collection completed!", style="bold green"))
# Convert to DataFrame and sort by multifactor score
df = pd.DataFrame(all_data)
df = df.sort_values('multifactor_score', ascending=False)
# Save to CSV
file_exists = os.path.isfile('meme_coin_data.csv')
if not file_exists:
df.to_csv('meme_coin_data.csv', mode='w', header=True, index=False)
console.print(f"[green]Created new meme_coin_data.csv with {len(df)} records[/green]")
else:
df.to_csv('meme_coin_data.csv', mode='a', header=False, index=False)
console.print(f"[green]Appended {len(df)} new records to meme_coin_data.csv[/green]")
console.print(f"[yellow]Skipped {len(skipped_tokens)} tokens due to missing data: {', '.join(skipped_tokens)}[/yellow]")
if is_main_thread:
# Display the collected tokens in a table format
table = Table(title="Token Data", show_lines=True)
table.add_column("Token Name", style="bold cyan")
table.add_column("Network", style="bold magenta")
table.add_column("Price (USD)", justify="right")
table.add_column("Market Cap (USD)", justify="right")
table.add_column("Volume 24h (USD)", justify="right")
table.add_column("Liquidity (USD)", justify="right")
table.add_column("Change 24h (%)", justify="right")
table.add_column("Score", justify="right")
for token in tokens_for_table:
price_change_color = "green" if float(token['Change 24h (%)'].strip('%')) >= 0 else "red"
score_value = float(token['Score'])
score_color = (
"green" if score_value >= 80 else
"light_green" if score_value >= 60 else
"yellow" if score_value >= 40 else
"orange1" if score_value >= 20 else
"red"
)
table.add_row(
token['Token Name'],
token['Network'],
token['Price (USD)'],
token['Market Cap (USD)'],
token['Volume 24h (USD)'],
token['Liquidity (USD)'],
f"[{price_change_color}]{token['Change 24h (%)']}[/]",
f"[{score_color}]{token['Score']}[/]"
)
console.print(table)
# Optionally, display the top 5 tokens with highest scores
top_5 = df.head(5)
top_table = Table(title="Top 5 Tokens by Multifactor Score", show_lines=True)
top_table.add_column("Rank", style="bold magenta")
top_table.add_column("Token Name", style="bold cyan")
top_table.add_column("Price (USD)", justify="right")
top_table.add_column("Market Cap (USD)", justify="right")
top_table.add_column("Volume 24h (USD)", justify="right")
top_table.add_column("Liquidity (USD)", justify="right")
top_table.add_column("Change 24h (%)", justify="right")
top_table.add_column("Score", justify="right")
for rank, (_, row) in enumerate(top_5.iterrows(), start=1):
price_change_color = "green" if row['price_change_24h'] >= 0 else "red"
score_color = (
"green" if row['multifactor_score'] >= 80 else
"light_green" if row['multifactor_score'] >= 60 else
"yellow" if row['multifactor_score'] >= 40 else
"orange1" if row['multifactor_score'] >= 20 else
"red"
)
top_table.add_row(
str(rank),
row['token_name'],
f"${row['token_price']:.6f}",
f"${row['market_cap']:,.2f}",
f"${row['volume_24h']:,.2f}",
f"${row['liquidity']:,.2f}",
f"[{price_change_color}]{row['price_change_24h']:.2f}%[/]",
f"[{score_color}]{row['multifactor_score']:.2f}[/]"
)
console.print(top_table)
# Load data into the data manager if needed
data_manager.load_data()
def display_summary(df):
console.print("\n[bold cyan]Data Collection Summary:[/bold cyan]")
console.print(f"Total Tokens Processed: {len(df)}")
console.print(f"\n[bold cyan]Score Distribution:[/bold cyan]")
console.print(f"0-20 (Low performing): [red]{len(df[df['multifactor_score'] <= 20])}[/red]")
console.print(f"21-40 (Below average): [yellow]{len(df[(df['multifactor_score'] > 20) & (df['multifactor_score'] <= 40)])}[/yellow]")
console.print(f"41-60 (Average): [cyan]{len(df[(df['multifactor_score'] > 40) & (df['multifactor_score'] <= 60)])}[/cyan]")
console.print(f"61-80 (Above average): [green]{len(df[(df['multifactor_score'] > 60) & (df['multifactor_score'] <= 80)])}[/green]")
console.print(f"81-100 (High performing): [bold green]{len(df[df['multifactor_score'] > 80])}[/bold green]")
console.print("\n[bold cyan]Top 10 Tokens by Score:[/bold cyan]")
top_10 = df.nlargest(10, 'multifactor_score')
for _, row in top_10.iterrows():
score = row['multifactor_score']
if score <= 20:
score_color = "red"
elif score <= 40:
score_color = "yellow"
elif score <= 60:
score_color = "cyan"
elif score <= 80:
score_color = "green"
else:
score_color = "bold green"
console.print(f"{row['token_name']:20} Score: [{score_color}]{score:.2f}[/{score_color}]")
def process_pool_data(pool_attributes):
# This function would contain the detailed data processing logic
# Simplified for brevity
return {
'token_name': pool_attributes.get('name', 'Unknown'),
'token_price': float(pool_attributes.get('base_token_price_usd', 0)),
'market_cap': float(pool_attributes.get('market_cap_usd', 0) or 0),
# Add other necessary fields here
}
def save_to_csv(df):
file_exists = os.path.isfile('meme_coin_data.csv')
if not file_exists:
df.to_csv('meme_coin_data.csv', mode='w', header=True, index=False)
console.print("[green]Created new meme_coin_data.csv[/green]")
else:
df.to_csv('meme_coin_data.csv', mode='a', header=False, index=False)
console.print("[green]Appended new records to meme_coin_data.csv[/green]")
logger = logging.getLogger(__name__)
def multifactor_score(price_momentum, volume_1h, volume_24h, market_cap, volatility, liquidity_ratio, ohlcv_metrics):
try:
# Define weights
weights = {
'price_momentum': 0.25,
'price_reversion': 0.20,
'volume_acceleration': 0.30,
'market_cap': 0.05,
'volatility': 0.15,
'liquidity_ratio': 0.05
}
# Calculate factors
norm_price_momentum = normalize_price_momentum(price_momentum)
norm_price_reversion = calculate_price_reversion(ohlcv_metrics)
norm_volume_acceleration = calculate_volume_acceleration(ohlcv_metrics)
norm_market_cap = normalize_market_cap(market_cap)
norm_volatility = normalize_volatility_for_lp(volatility, price_momentum)
norm_liquidity_ratio = normalize_liquidity_ratio(liquidity_ratio)
# Calculate weighted score
weighted_scores = {
'price_momentum': norm_price_momentum * weights['price_momentum'],
'price_reversion': norm_price_reversion * weights['price_reversion'],
'volume_acceleration': norm_volume_acceleration * weights['volume_acceleration'],
'market_cap': norm_market_cap * weights['market_cap'],
'volatility': norm_volatility * weights['volatility'],
'liquidity_ratio': norm_liquidity_ratio * weights['liquidity_ratio']
}
raw_score = sum(weighted_scores.values())
# Apply sigmoid function for final score
final_score = 100 / (1 + np.exp(-12 * (raw_score - 0.5)))
return final_score
except Exception as e:
logger.error(f"Error calculating multifactor score: {str(e)}")
return 0
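# Worked example of the sigmoid mapping in multifactor_score: a raw weighted
# score of 0.5 maps to 50, while 0.7 maps to roughly 92, because the steepness
# factor of 12 stretches mid-range differences toward the extremes.
def _example_sigmoid_score(raw_score=0.7, steepness=12, midpoint=0.5):
    return 100 / (1 + np.exp(-steepness * (raw_score - midpoint)))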
def normalize_price_momentum(x):
return np.clip((np.tanh(x / 30) + 1) / 2, 0, 1)
def calculate_price_reversion(ohlcv_metrics):
    # The raw API responses passed in nest candles under data -> attributes -> ohlcv_list
    daily_data = (ohlcv_metrics.get('day', {}) or {}).get('data', {}).get('attributes', {}).get('ohlcv_list', [])
    if len(daily_data) < 3:
        return 0.5  # Neutral score if not enough data
    closing_prices = [float(day[4]) for day in daily_data]
    recent_change = (closing_prices[-1] - closing_prices[-2]) / closing_prices[-2]
    avg_change = np.mean(np.diff(closing_prices) / np.array(closing_prices[:-1]))
    denominator = max(abs(avg_change), abs(recent_change))
    if denominator == 0:
        return 0.5  # No movement at all; treat as neutral
    reversion_potential = (avg_change - recent_change) / denominator
    return np.clip((np.tanh(reversion_potential) + 1) / 2, 0, 1)
def calculate_volume_acceleration(ohlcv_metrics):
    hourly_data = (ohlcv_metrics.get('hour', {}) or {}).get('data', {}).get('attributes', {}).get('ohlcv_list', [])
    if len(hourly_data) < 24:
        return 0.5  # Neutral score if not enough data
    volumes = [float(hour[5]) for hour in hourly_data[-24:]]  # Last 24 hours
    if volumes[0] == 0:
        return 0.5  # Avoid division by zero on a dead pool
    # Discrete second difference: compares the most recent half-day trend against the prior one
    volume_acceleration = (volumes[-1] - 2 * volumes[-12] + volumes[-24]) / volumes[-24]
    return np.clip((np.tanh(volume_acceleration * 10) + 1) / 2, 0, 1)
def normalize_market_cap(x):
    # Guard against non-positive inputs, which would make log10 blow up
    return np.clip(np.log10(max(x, 1)) / 12, 0, 1)
def normalize_volatility_for_lp(volatility, price_momentum):
    # price_momentum is accepted for call-site symmetry but not currently used here
    optimal_volatility = 0.1
    volatility_score = 1 - abs(volatility - optimal_volatility) / max(volatility, optimal_volatility)
    return np.clip(volatility_score * 1.5, 0, 1)
def normalize_liquidity_ratio(x):
return np.clip(x / 0.3, 0, 1)
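# Hedged demonstration of the normalizers above on sample inputs (numbers are
# illustrative): each maps its raw factor into [0, 1] before weighting.
def _example_normalizer_outputs():
    return {
        'momentum_+30pct': normalize_price_momentum(30),          # (tanh(1) + 1) / 2 -> ~0.88
        'mcap_1M': normalize_market_cap(1_000_000),               # log10(1e6) / 12 -> 0.5
        'liquidity_ratio_0.15': normalize_liquidity_ratio(0.15),  # 0.15 / 0.3 -> 0.5
    }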
def implement_garch(historical_prices):
"""
Calculates volatility using the GARCH model.
Parameters:
- historical_prices (list): List of historical price data.
Returns:
- volatility_forecast (float): The forecasted volatility.
"""
try:
# Convert prices to a numpy array
historical_prices = np.array(historical_prices, dtype=float)
# Ensure prices are positive
historical_prices = historical_prices[historical_prices > 0]
if len(historical_prices) < 2:
console.print("[yellow]Warning: Not enough positive price data for volatility calculation.[/yellow]")
return 0
# Calculate log returns
returns = np.diff(np.log(historical_prices))
returns = returns[np.isfinite(returns)] # Remove NaNs and infs
if len(returns) < 100:
console.print("[yellow]Warning: Insufficient data for GARCH modeling. Using standard deviation.[/yellow]")
return np.std(returns) if len(returns) > 1 else 0
model = arch_model(returns, vol='GARCH', p=1, q=1)
results = model.fit(disp='off')
forecast = results.forecast(horizon=1)
volatility_forecast = np.sqrt(forecast.variance.values[-1, :])[0]
console.print(f"[green]Successfully calculated GARCH volatility: {volatility_forecast:.4f}[/green]")
return volatility_forecast
    except Exception as e:
        console.print(f"[yellow]Warning: GARCH modeling failed. Using standard deviation. Error: {str(e)}[/yellow]")
        # Recompute returns defensively in case the failure happened before filtering
        prices = np.array(historical_prices, dtype=float)
        prices = prices[prices > 0]
        returns = np.diff(np.log(prices))
        return np.std(returns) if len(returns) > 1 else 0
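# Hedged sketch: exercising implement_garch on a synthetic geometric random
# walk with enough points to clear the 100-return threshold above. Synthetic
# data only; real calls use OHLCV closes.
def _example_garch_on_synthetic_prices(n=250, seed=42):
    rng = np.random.default_rng(seed)
    prices = 100 * np.exp(np.cumsum(rng.normal(0, 0.02, size=n)))
    return implement_garch(prices)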
def kalman_trend(prices):
kf = KalmanFilter(transition_matrices=[1], observation_matrices=[1],
initial_state_mean=0, initial_state_covariance=1,
observation_covariance=1, transition_covariance=.01)
return kf.filter(prices)[0].flatten()
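# Usage sketch for kalman_trend: smoothing a noisy random-walk price series
# into its filtered state means. Inputs are illustrative.
def _example_kalman_smoothing(seed=0, n=50):
    rng = np.random.default_rng(seed)
    noisy_prices = 10 + np.cumsum(rng.normal(0, 0.1, size=n))
    return kalman_trend(noisy_prices)  # same length as the input, but denoised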
def estimate_tail_risk(returns, threshold=0.05):
try:
valid_returns = returns[np.isfinite(returns)]
if len(valid_returns) < 10:
console.print("[yellow]Warning: Not enough valid data for tail risk estimation.[/yellow]")
return None, None
tail_returns = valid_returns[valid_returns < np.quantile(valid_returns, threshold)]
if len(tail_returns) < 5:
console.print("[yellow]Warning: Not enough tail data for estimation.[/yellow]")
return None, None
shape, _, scale = stats.genpareto.fit(tail_returns)
return shape, scale
except Exception as e:
console.print(f"[yellow]Warning: Error in tail risk estimation - {str(e)}[/yellow]")
return None, None
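# Hedged demonstration of estimate_tail_risk: fitting a generalized Pareto
# distribution to the worst 5% of fat-tailed synthetic returns. A positive
# shape parameter indicates a heavy left tail.
def _example_tail_risk(seed=1, n=500):
    rng = np.random.default_rng(seed)
    returns = rng.standard_t(df=3, size=n) * 0.02  # toy Student-t returns
    shape, scale = estimate_tail_risk(returns, threshold=0.05)
    return shape, scale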
def prepare_data_for_timeframe(df, timeframe_minutes):
base_columns = ['price_change_5m', 'price_change_1h', 'volume_1h', 'volume_24h', 'pool_age_hours', 'market_cap', 'fdv']
price_change_col = f'price_change_{timeframe_minutes}m'
required_columns = base_columns + [price_change_col]
df = df.copy() # Create a copy to avoid SettingWithCopyWarning
if price_change_col not in df.columns:
df.loc[:, price_change_col] = df['price_change_24h'] * (timeframe_minutes / 1440)
df.loc[:, 'effective_market_cap'] = df['market_cap'].fillna(df['fdv'])
df.loc[:, 'effective_market_cap'] = df['effective_market_cap'].fillna(df['liquidity'] * 2)
df.loc[:, 'effective_market_cap'] = df['effective_market_cap'].clip(lower=1000)
df.loc[:, 'volume_1h'] = df['volume_1h'].clip(lower=0)
df.loc[:, 'volume_24h'] = df['volume_24h'].clip(lower=0)
df_prepared = df[required_columns + ['effective_market_cap']].dropna(subset=['effective_market_cap'])
df_prepared = df_prepared[df_prepared['effective_market_cap'] >= 1000]
df_prepared.loc[:, 'pool_age_hours'] = df_prepared['pool_age_hours'].clip(lower=0)
if df_prepared.empty:
log.warning(f"No valid data for {timeframe_minutes} minute timeframe after removing NaN values")
return None
return df_prepared
def calculate_price_range(timeframe_minutes, df_recent):
# Calculate volatility based on recent price changes
price_changes = df_recent['price_change_24h'].dropna()
if len(price_changes) > 0:
volatility = np.std(price_changes) * np.sqrt(1440 / timeframe_minutes)
else:
volatility = 0.1 # Default value if no data available
# Determine price range based on volatility and timeframe
if timeframe_minutes <= 60: # Short timeframe
if volatility < 0.05:
return "Wide (~30% up/down)"
elif volatility < 0.1:
return "Medium (~17% up/down)"
else:
return "Narrow (~10% up/down)"
elif timeframe_minutes <= 360: # Medium timeframe
if volatility < 0.1:
return "Wide (~30% up/down)"
elif volatility < 0.2:
return "Medium (~17% up/down)"
else:
return "Narrow (~10% up/down)"
else: # Long timeframe
if volatility < 0.15:
return "Wide (~30% up/down)"
elif volatility < 0.25:
return "Medium (~17% up/down)"
else:
return "Narrow (~10% up/down)"
def get_current_recommendations(timeframe_minutes, mode, df_recent):
log.info(f"Generating recommendations for {timeframe_minutes} minute timeframe in {mode} mode")
try:
df_prepared = prepare_data_for_timeframe(df_recent, timeframe_minutes)
if df_prepared is None or df_prepared.empty:
raise ValueError(f"Insufficient data for {timeframe_minutes} minute timeframe")
risk_factors = {'degen': 1.5, 'moderate': 1.2, 'conservative': 1.0}
risk_factor = risk_factors[mode]
log.info(f"Applied risk factor: {risk_factor}")
recommendations = {}
explanations = {}
        # Market cap recommendation: 25th percentile of sub-$100M pools,
        # risk-adjusted, then clamped to the [$1M, $30M] band
        valid_market_caps = df_prepared['effective_market_cap'][df_prepared['effective_market_cap'] < 100000000]
        raw_mcap = valid_market_caps.quantile(0.25)
        adjusted_mcap = raw_mcap * risk_factor
        final_mcap = max(round(adjusted_mcap, -3), 1000000)
        final_mcap = min(final_mcap, 30000000)
recommendations['Min Token Market Cap'] = final_mcap
explanations['Min Token Market Cap'] = f"""
Raw 25th percentile: ${raw_mcap:,.0f}
Risk-adjusted value: ${adjusted_mcap:,.0f}
Minimum threshold: $1,000,000
Maximum threshold: $30,000,000
Final value: ${final_mcap:,.0f}
"""
# Price change calculations
price_change_col = f'price_change_{timeframe_minutes}m'
if price_change_col not in df_prepared.columns:
df_prepared[price_change_col] = df_prepared['price_change_24h'] * (timeframe_minutes / 1440)
# 5M Price Change
raw_value_5m = df_prepared[price_change_col].quantile(0.10) * (5 / timeframe_minutes)
adjusted_value_5m = round(raw_value_5m * risk_factor, 2)
recommendations['Min Token 5M Price Change (%)'] = adjusted_value_5m
explanations['Min Token 5M Price Change (%)'] = f"""
Raw 10th percentile (scaled to 5M): {raw_value_5m:.2f}%
Risk adjustment: {risk_factor:.2f}x
Final value: {adjusted_value_5m:.2f}%
"""
# 1H Price Change
raw_value_1h = df_prepared[price_change_col].quantile(0.10) * (60 / timeframe_minutes)
adjusted_value_1h = round(raw_value_1h * risk_factor, 2)
recommendations['Min Token 1H Price Change (%)'] = adjusted_value_1h
explanations['Min Token 1H Price Change (%)'] = f"""
Raw 10th percentile (scaled to 1H): {raw_value_1h:.2f}%
Risk adjustment: {risk_factor:.2f}x
Final value: {adjusted_value_1h:.2f}%
"""
# Max 1H Price Change
max_change = df_prepared[price_change_col].quantile(0.95) * (60 / timeframe_minutes)
adjusted_max_change = min(round(max_change * risk_factor, 2), 500)
recommendations['Max Token 1H Price Change (%)'] = adjusted_max_change
explanations['Max Token 1H Price Change (%)'] = f"""
Raw 95th percentile (scaled to 1H): {max_change:.2f}%
Risk adjustment: {risk_factor:.2f}x
Capped at 500%
Final value: {adjusted_max_change:.2f}%
"""
# Volume calculations
volume_col = 'volume_1h' if timeframe_minutes <= 60 else 'volume_24h'
raw_volume = df_prepared[volume_col].quantile(0.25)
# 1H Volume
scaled_volume_1h = raw_volume * (60 / (60 if volume_col == 'volume_1h' else 1440)) * (timeframe_minutes / 60)
adjusted_volume_1h = round(scaled_volume_1h * risk_factor, -3)
final_volume_1h = max(adjusted_volume_1h, 50000)
recommendations['Min Token 1H Volume'] = final_volume_1h
explanations['Min Token 1H Volume'] = f"""
Raw 25th percentile (scaled to 1H): ${scaled_volume_1h:,.0f}
Risk-adjusted value: ${adjusted_volume_1h:,.0f}
Minimum threshold: $50,000
Final value: ${final_volume_1h:,.0f}
"""
# 24H Volume
scaled_volume_24h = raw_volume * (1440 / (60 if volume_col == 'volume_1h' else 1440)) * (timeframe_minutes / 1440)
adjusted_volume_24h = round(scaled_volume_24h * risk_factor, -3)
final_volume_24h = max(adjusted_volume_24h, 1000000)
recommendations['Min Token 24H Volume'] = final_volume_24h
explanations['Min Token 24H Volume'] = f"""
Raw 25th percentile (scaled to 24H): ${scaled_volume_24h:,.0f}
Risk-adjusted value: ${adjusted_volume_24h:,.0f}
Minimum threshold: $1,000,000
Final value: ${final_volume_24h:,.0f}
"""
# Token Age
raw_age = df_prepared['pool_age_hours'].quantile(0.10)
adjusted_age = round(max(raw_age * risk_factor, 0.1), 1)
final_age = max(adjusted_age, timeframe_minutes / 60)
recommendations['Min Token Age (hrs)'] = final_age
explanations['Min Token Age (hrs)'] = f"""
Raw 10th percentile: {raw_age:.1f} hours
Risk-adjusted value: {adjusted_age:.1f} hours
Minimum threshold: {timeframe_minutes / 60:.1f} hours
Final value: {final_age:.1f} hours
"""
# Dynamic Stop Loss
volatility = df_prepared[price_change_col].std() * np.sqrt(1440 / timeframe_minutes)
base_stop_loss = volatility * 2
adjusted_stop_loss = base_stop_loss * (1 / risk_factor) # Inverse risk factor for stop loss
final_stop_loss = max(min(adjusted_stop_loss, 20), 5)
recommendations['Dynamic Stop Loss (%)'] = -round(final_stop_loss, 2)
explanations['Dynamic Stop Loss (%)'] = f"""
Volatility (24h equivalent): {volatility:.2f}%
Base stop loss (2x volatility): {base_stop_loss:.2f}%
Risk-adjusted stop loss: {adjusted_stop_loss:.2f}%
Final stop loss (capped between 5% and 20%): {final_stop_loss:.2f}%
"""
# Calculate and add price range setting
price_range = calculate_price_range(timeframe_minutes, df_recent)
recommendations['Price Range Setting'] = price_range
explanations['Price Range Setting'] = f"""
Automatically determined based on timeframe ({timeframe_minutes} minutes) and current market volatility.
Wide: Price can go up or down ~30% (Larger range to earn fees)
Medium: Price can go up or down ~17%
Narrow: Price can go up or down ~10% (Higher risk of full conversion)
Selected: {price_range}
"""
return recommendations, explanations
except Exception as e:
log.error(f"An error occurred while generating recommendations: {str(e)}")
log.error(f"Traceback: {traceback.format_exc()}")
return None, None
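# Illustrative call (assumes meme_coin_data.csv already exists from a prior
# collection run): moderate-risk recommendations for a 60-minute timeframe.
def _example_recommendations(timeframe_minutes=60, mode='moderate'):
    data_manager.load_data()
    recommendations, explanations = get_current_recommendations(
        timeframe_minutes, mode, data_manager.get_recent_data())
    return recommendations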
def prepare_data_for_ml():
data_manager.load_data()
df = data_manager.df.copy()
features = ['market_cap', 'volume_24h', 'price_change_24h', 'transactions_24h_buys', 'transactions_24h_sells', 'pool_age_hours']
for col in features:
if col not in df.columns:
df[col] = 0
df[col] = pd.to_numeric(df[col], errors='coerce')
df = df.dropna(subset=features)
# Log market cap distribution before filtering
market_cap_percentiles_before = df['market_cap'].quantile([0.1, 0.25, 0.5, 0.75, 0.9])
console.print(f"[cyan]Market Cap Percentiles (Before Filtering):[/cyan]")
for percentile, value in market_cap_percentiles_before.items():
console.print(f"[cyan]{percentile*100}%: ${value:,.0f}[/cyan]")
# Filter out high market cap tokens
df = df[df['market_cap'] < 100000000]
# Log market cap distribution after filtering
market_cap_percentiles_after = df['market_cap'].quantile([0.1, 0.25, 0.5, 0.75, 0.9])
console.print(f"[cyan]Market Cap Percentiles (After Filtering):[/cyan]")
for percentile, value in market_cap_percentiles_after.items():
console.print(f"[cyan]{percentile*100}%: ${value:,.0f}[/cyan]")
# Calculate volatility (using 24h price change as a simple proxy)
df['volatility'] = df['price_change_24h'].rolling(window=7).std()
# Calculate dynamic stop loss (between -10% and -50%)
df['dynamic_stop_loss'] = df['volatility'].clip(lower=10, upper=50) * -1
df['volume_ratio'] = df['volume_24h'] / df['volume_24h'].rolling(window=24).mean()
df['best_timeframe'] = np.clip(df['volume_ratio'] * 720, 30, 1440)
df['min_token_5m_price_change'] = df['price_change_24h'] / (24 * 12)
df['min_token_1h_price_change'] = df['price_change_24h'] / 24
df['max_token_1h_price_change'] = df['price_change_24h'].rolling(window=24).max()
df['min_token_1h_volume'] = df['volume_24h'] / 24
df['min_token_24h_volume'] = df['volume_24h']
df['min_token_market_cap'] = df['market_cap'].clip(upper=50000000)
df['min_token_age'] = df['pool_age_hours']
targets = ['best_timeframe', 'min_token_5m_price_change', 'min_token_1h_price_change',
'max_token_1h_price_change', 'min_token_1h_volume', 'min_token_24h_volume',
'min_token_market_cap', 'min_token_age', 'dynamic_stop_loss']
df = df.dropna(subset=targets)
for col in features + targets:
console.print(f"[cyan]{col} - min: {df[col].min():.2f}, max: {df[col].max():.2f}, mean: {df[col].mean():.2f}[/cyan]")
X = df[features].values
y = df[targets].values
scaler = StandardScaler()
X_scaled = scaler.fit_transform(X)
X_train, X_test, y_train, y_test = train_test_split(X_scaled, y, test_size=0.2, random_state=42)
return (X_train, X_test, y_train, y_test), targets, scaler
def train_random_forest():
try:
(X_train, X_test, y_train, y_test), target_names, scaler = prepare_data_for_ml()
model = RandomForestRegressor(n_estimators=100, max_depth=10, random_state=42)
model.fit(X_train, y_train)
y_pred = model.predict(X_test)
mse = mean_squared_error(y_test, y_pred, multioutput='raw_values')
r2 = r2_score(y_test, y_pred, multioutput='raw_values')
console.print(f"[green]Random Forest Model Trained:[/green]")
for i, target in enumerate(target_names):
console.print(f"{target} - MSE: {mse[i]:.4f}, R-squared: {r2[i]:.4f}")
return model, target_names, scaler
except Exception as e:
console.print(f"[bold red]Error in training Random Forest: {str(e)}[/bold red]")
console.print(f"[red]Traceback: {traceback.format_exc()}[/red]")
return None, None, None
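# Hedged end-to-end sketch of the ML path (assumes collected data is on disk):
# train the multi-output forest, then feed the latest row through
# generate_ml_recommendations, defined below.
def _example_train_and_recommend():
    model, target_names, scaler = train_random_forest()
    if model is None:
        return None
    return generate_ml_recommendations(model, target_names, scaler)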
def generate_ml_recommendations(model, target_names, scaler):
try:
recent_data = data_manager.get_recent_data().iloc[-1]
features = ['market_cap', 'volume_24h', 'price_change_24h', 'transactions_24h_buys', 'transactions_24h_sells', 'pool_age_hours']
X = recent_data[features].values.reshape(1, -1)
X_scaled = scaler.transform(X)
predictions = model.predict(X_scaled)[0]
recommendations = {target: max(0, pred) if 'stop_loss' not in target else pred for target, pred in zip(target_names, predictions)}
# Ensure stop loss is within -10% to -50% range
if 'dynamic_stop_loss' in recommendations:
recommendations['dynamic_stop_loss'] = max(-50, min(-10, recommendations['dynamic_stop_loss']))