"""
|
|
Enhanced Trading Orchestrator - Advanced Multi-Modal Decision Making
|
|
|
|
This enhanced orchestrator implements:
|
|
1. Multi-timeframe CNN predictions with individual confidence scores
|
|
2. Advanced RL feedback loop for continuous learning
|
|
3. Multi-symbol (ETH, BTC) coordinated decision making
|
|
4. Perfect move marking for CNN backpropagation training
|
|
5. Market environment adaptation through RL evaluation
|
|
6. Universal data format compliance (5 timeseries streams)
|
|
"""

import asyncio
import logging
import time
import numpy as np
import pandas as pd
from datetime import datetime, timedelta
from typing import Dict, List, Optional, Tuple, Any, Union
from dataclasses import dataclass, field
from collections import deque

import torch
import ta

from .config import get_config
from .data_provider import DataProvider, RawTick, OHLCVBar, MarketTick
from .universal_data_adapter import UniversalDataAdapter, UniversalDataStream
from .realtime_tick_processor import RealTimeTickProcessor, ProcessedTickFeatures, integrate_with_orchestrator
from models import get_model_registry, ModelInterface, CNNModelInterface, RLAgentInterface
from .extrema_trainer import ExtremaTrainer
# NOTE: core.trading_action.TradingAction is intentionally not imported here;
# this module defines its own TradingAction dataclass below (carrying
# timeframe_analysis context), which would otherwise shadow that import.
from .negative_case_trainer import NegativeCaseTrainer
from .trading_executor import TradingExecutor
from .cnn_monitor import log_cnn_prediction, start_cnn_training_session
# Enhanced pivot RL trainer functionality integrated into orchestrator

logger = logging.getLogger(__name__)


@dataclass
class TimeframePrediction:
    """CNN prediction for a specific timeframe with confidence"""
    timeframe: str
    action: str  # 'BUY', 'SELL', 'HOLD'
    confidence: float  # 0.0 to 1.0
    probabilities: Dict[str, float]  # Action probabilities
    timestamp: datetime
    market_features: Dict[str, float] = field(default_factory=dict)  # Additional context


@dataclass
class EnhancedPrediction:
    """Enhanced prediction structure with timeframe breakdown"""
    symbol: str
    timeframe_predictions: List[TimeframePrediction]
    overall_action: str
    overall_confidence: float
    model_name: str
    timestamp: datetime
    metadata: Dict[str, Any] = field(default_factory=dict)


@dataclass
class TradingAction:
    """Represents a trading action with full context (module-local definition)"""
    symbol: str
    action: str  # 'BUY', 'SELL', 'HOLD'
    quantity: float
    confidence: float
    price: float
    timestamp: datetime
    reasoning: Dict[str, Any]
    timeframe_analysis: List[TimeframePrediction]


@dataclass
class MarketState:
    """Complete market state for RL evaluation with comprehensive data"""
    symbol: str
    timestamp: datetime
    prices: Dict[str, float]  # {timeframe: current_price}
    features: Dict[str, np.ndarray]  # {timeframe: feature_matrix}
    volatility: float
    volume: float
    trend_strength: float
    market_regime: str  # 'trending', 'ranging', 'volatile'
    universal_data: UniversalDataStream  # Universal format data

    # Enhanced data for comprehensive RL state building
    raw_ticks: List[Dict[str, Any]] = field(default_factory=list)  # Last 300s of tick data
    ohlcv_data: Dict[str, List[Dict[str, Any]]] = field(default_factory=dict)  # Multi-timeframe OHLCV
    btc_reference_data: Dict[str, List[Dict[str, Any]]] = field(default_factory=dict)  # BTC correlation data
    cnn_hidden_features: Optional[Dict[str, np.ndarray]] = None  # CNN hidden layer features
    cnn_predictions: Optional[Dict[str, np.ndarray]] = None  # CNN predictions by timeframe
    pivot_points: Optional[Dict[str, Any]] = None  # Williams market structure data
    market_microstructure: Dict[str, Any] = field(default_factory=dict)  # Tick-level patterns


@dataclass
class PerfectMove:
    """Marked perfect move for CNN training"""
    symbol: str
    timeframe: str
    timestamp: datetime
    optimal_action: str
    actual_outcome: float  # Price change percentage
    market_state_before: MarketState
    market_state_after: MarketState
    confidence_should_have_been: float


@dataclass
class TradeInfo:
    """Information about an active trade"""
    symbol: str
    side: str  # 'LONG' or 'SHORT'
    entry_price: float
    entry_time: datetime
    size: float
    confidence: float
    market_state: Dict[str, Any]


@dataclass
class LearningCase:
    """A learning case for DQN sensitivity training"""
    state_vector: np.ndarray
    action: int  # sensitivity level chosen
    reward: float
    next_state_vector: np.ndarray
    done: bool
    trade_info: TradeInfo
    outcome: float  # P&L percentage

class EnhancedTradingOrchestrator:
    """
    Enhanced orchestrator with sophisticated multi-modal decision making
    and universal data format compliance
    """

    def __init__(self,
                 data_provider: DataProvider = None,
                 symbols: List[str] = None,
                 enhanced_rl_training: bool = True,
                 model_registry: Dict = None):
        """Initialize the enhanced orchestrator with 2-action system"""
        self.config = get_config()
        self.data_provider = data_provider or DataProvider()
        self.model_registry = model_registry or get_model_registry()

        # Enhanced RL training integration
        self.enhanced_rl_training = enhanced_rl_training

        # Override symbols if provided
        if symbols:
            self.symbols = symbols
        else:
            self.symbols = self.config.symbols

        logger.info(f"Enhanced orchestrator initialized with symbols: {self.symbols}")
        logger.info("2-Action System: BUY/SELL with intelligent position management")
        if self.enhanced_rl_training:
            logger.info("Enhanced RL training enabled")

        # Position tracking for 2-action system
        self.current_positions = {}  # symbol -> {'side': 'LONG'|'SHORT'|'FLAT', 'entry_price': float, 'timestamp': datetime}
        self.last_signals = {}  # symbol -> {'action': 'BUY'|'SELL', 'timestamp': datetime, 'confidence': float}

        # Pivot-based dynamic thresholds (simplified without external trainer)
        self.entry_threshold = 0.7  # Higher threshold for entries
        self.exit_threshold = 0.3  # Lower threshold for exits
        self.uninvested_threshold = 0.4  # Stay out threshold

        logger.info("Pivot-Based Thresholds:")
        logger.info(f"  Entry threshold: {self.entry_threshold:.3f} (more certain)")
        logger.info(f"  Exit threshold: {self.exit_threshold:.3f} (easier to exit)")
        logger.info(f"  Uninvested threshold: {self.uninvested_threshold:.3f} (stay out when uncertain)")

        # Initialize universal data adapter
        self.universal_adapter = UniversalDataAdapter(self.data_provider)

        # Initialize real-time tick processor for ultra-low latency processing
        self.tick_processor = RealTimeTickProcessor(symbols=self.config.symbols)

        # Initialize extrema trainer for local bottom/top detection and 200-candle context
        self.extrema_trainer = ExtremaTrainer(
            data_provider=self.data_provider,
            symbols=self.config.symbols,
            window_size=10  # 10-candle window for extrema detection
        )

        # Initialize negative case trainer for intensive training on losing trades
        self.negative_case_trainer = NegativeCaseTrainer()

        # Real-time tick features storage
        self.realtime_tick_features = {symbol: deque(maxlen=100) for symbol in self.config.symbols}

        # Multi-symbol configuration
        self.timeframes = self.config.timeframes

        # Configuration with different thresholds for opening vs closing
        self.confidence_threshold_open = self.config.orchestrator.get('confidence_threshold', 0.6)
        self.confidence_threshold_close = self.config.orchestrator.get('confidence_threshold_close', 0.25)  # Much lower for closing
        self.decision_frequency = self.config.orchestrator.get('decision_frequency', 30)

        # DQN RL-based sensitivity learning parameters
        self.sensitivity_learning_enabled = True
        self.sensitivity_dqn_agent = None  # Initialized lazily when the first DQN model is available
        self.sensitivity_state_size = 20  # Features for sensitivity learning
        self.sensitivity_action_space = 5  # 5 sensitivity levels: very_low, low, medium, high, very_high
        self.current_sensitivity_level = 2  # Start with medium (index 2)
        self.sensitivity_levels = {
            0: {'name': 'very_low', 'close_threshold_multiplier': 0.5, 'open_threshold_multiplier': 1.2},
            1: {'name': 'low', 'close_threshold_multiplier': 0.7, 'open_threshold_multiplier': 1.1},
            2: {'name': 'medium', 'close_threshold_multiplier': 1.0, 'open_threshold_multiplier': 1.0},
            3: {'name': 'high', 'close_threshold_multiplier': 1.3, 'open_threshold_multiplier': 0.9},
            4: {'name': 'very_high', 'close_threshold_multiplier': 1.5, 'open_threshold_multiplier': 0.8}
        }

        # Trade tracking for sensitivity learning
        self.active_trades = {}  # symbol -> trade_info with entry details
        self.completed_trades = deque(maxlen=1000)  # Store last 1000 completed trades for learning
        self.sensitivity_learning_queue = deque(maxlen=500)  # Queue for DQN training

        # Enhanced weighting system
        self.timeframe_weights = self._initialize_timeframe_weights()
        self.symbol_correlation_matrix = self._initialize_correlation_matrix()

        # State tracking for each symbol
        self.symbol_states = {symbol: {} for symbol in self.symbols}
        self.recent_actions = {symbol: deque(maxlen=100) for symbol in self.symbols}
        self.market_states = {symbol: deque(maxlen=1000) for symbol in self.symbols}

        # Perfect move tracking for CNN training with enhanced retrospective learning
        self.perfect_moves = deque(maxlen=10000)
        self.performance_tracker = {}
        self.retrospective_learning_active = False
        self.last_retrospective_analysis = datetime.now()

        # Local extrema tracking for training on bottoms and tops
        self.local_extrema = {symbol: deque(maxlen=1000) for symbol in self.symbols}
        self.extrema_detection_window = 10  # Look for extrema in 10-candle windows
        self.extrema_training_queue = deque(maxlen=500)  # Queue for extrema-based training
        self.last_extrema_check = {symbol: datetime.now() for symbol in self.symbols}

        # 200-candle context data for models
        self.context_data_1m = {symbol: deque(maxlen=200) for symbol in self.symbols}
        self.context_features_1m = {symbol: None for symbol in self.symbols}
        self.context_update_frequency = 60  # Update context every 60 seconds
        self.last_context_update = {symbol: datetime.now() for symbol in self.symbols}

        # RL feedback system
        self.rl_evaluation_queue = deque(maxlen=1000)
        self.environment_adaptation_rate = 0.01

        # Decision callbacks
        self.decision_callbacks = []
        self.learning_callbacks = []

        # Integrate tick processor with orchestrator
        integrate_with_orchestrator(self, self.tick_processor)

        # Subscribe to raw tick data and OHLCV bars from data provider
        self.raw_tick_subscriber_id = self.data_provider.subscribe_to_raw_ticks(self._handle_raw_tick)
        self.ohlcv_bar_subscriber_id = self.data_provider.subscribe_to_ohlcv_bars(self._handle_ohlcv_bar)

        # Raw tick and OHLCV data storage for models
        self.raw_tick_buffers = {symbol: deque(maxlen=1000) for symbol in self.symbols}
        self.ohlcv_bar_buffers = {symbol: deque(maxlen=3600) for symbol in self.symbols}  # 1 hour of 1s bars

        # Pattern-based decision enhancement
        self.pattern_weights = {
            'rapid_fire': 1.5,
            'volume_spike': 1.3,
            'price_acceleration': 1.4,
            'high_frequency_bar': 1.2,
            'volume_concentration': 1.1
        }

        # Initialize 200-candle context data
        self._initialize_context_data()

        logger.info("Enhanced TradingOrchestrator initialized with Universal Data Format")
        logger.info(f"Symbols: {self.symbols}")
        logger.info(f"Timeframes: {self.timeframes}")
        logger.info("Universal format: ETH ticks, 1m, 1h, 1d + BTC reference ticks")
        logger.info(f"Opening confidence threshold: {self.confidence_threshold_open}")
        logger.info(f"Closing confidence threshold: {self.confidence_threshold_close}")
        logger.info("Real-time tick processor integrated for ultra-low latency processing")
        logger.info("Raw tick and OHLCV bar processing enabled for pattern detection")
        logger.info("Enhanced retrospective learning enabled for perfect opportunity detection")
        logger.info("DQN RL-based sensitivity learning enabled for adaptive thresholds")
        logger.info("Local extrema detection enabled for bottom/top training")
        logger.info("200-candle 1m context data initialized for enhanced model performance")

    def _initialize_timeframe_weights(self) -> Dict[str, float]:
        """Initialize weights for different timeframes"""
        # Weighting is biased toward the short scalping timeframes (1s/1m) for
        # entry/exit timing, with smaller contributions from higher timeframes
        # for trend direction; weights are renormalized over the configured set
        base_weights = {
            '1s': 0.60,  # Primary scalping signal (ticks)
            '1m': 0.20,  # Short-term confirmation
            '5m': 0.10,  # Short-term momentum
            '15m': 0.15, # Entry/exit timing
            '1h': 0.15,  # Medium-term trend
            '4h': 0.25,  # Stronger trend confirmation
            '1d': 0.05   # Long-term direction (minimal for scalping)
        }

        # Normalize weights for configured timeframes
        configured_weights = {tf: base_weights.get(tf, 0.1) for tf in self.timeframes}
        total = sum(configured_weights.values())
        return {tf: w / total for tf, w in configured_weights.items()}
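
    # Worked example of the normalization above: with configured timeframes
    # ['1m', '5m', '15m'] the base weights 0.20/0.10/0.15 sum to 0.45, so the
    # returned weights become ~0.444/0.222/0.333; with ['1s', '1m', '1h', '1d']
    # the base weights already sum to 1.0 and pass through unchanged.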

    def _initialize_correlation_matrix(self) -> Dict[Tuple[str, str], float]:
        """Initialize correlation matrix between symbols"""
        correlations = {}
        for i, symbol1 in enumerate(self.symbols):
            for j, symbol2 in enumerate(self.symbols):
                if i != j:
                    # ETH and BTC are typically highly correlated
                    if 'ETH' in symbol1 and 'BTC' in symbol2:
                        correlations[(symbol1, symbol2)] = 0.85
                    elif 'BTC' in symbol1 and 'ETH' in symbol2:
                        correlations[(symbol1, symbol2)] = 0.85
                    else:
                        correlations[(symbol1, symbol2)] = 0.7  # Default correlation
        return correlations

    async def make_coordinated_decisions(self) -> Dict[str, Optional[TradingAction]]:
        """
        Make coordinated trading decisions across all symbols using universal data format
        """
        decisions = {}

        try:
            # Get universal data stream (5 timeseries)
            universal_stream = self.universal_adapter.get_universal_data_stream()

            if universal_stream is None:
                logger.warning("Failed to get universal data stream")
                return decisions

            # Validate universal format
            is_valid, issues = self.universal_adapter.validate_universal_format(universal_stream)
            if not is_valid:
                logger.warning(f"Universal data format validation failed: {issues}")
                return decisions

            logger.info("UNIVERSAL DATA STREAM ACTIVE:")
            logger.info(f"  ETH ticks: {len(universal_stream.eth_ticks)} samples")
            logger.info(f"  ETH 1m: {len(universal_stream.eth_1m)} candles")
            logger.info(f"  ETH 1h: {len(universal_stream.eth_1h)} candles")
            logger.info(f"  ETH 1d: {len(universal_stream.eth_1d)} candles")
            logger.info(f"  BTC reference: {len(universal_stream.btc_ticks)} samples")
            logger.info(f"  Data quality: {universal_stream.metadata['data_quality']['overall_score']:.2f}")

            # Get market states for all symbols using universal data
            market_states = await self._get_all_market_states_universal(universal_stream)

            # Get enhanced predictions for all symbols
            symbol_predictions = {}
            for symbol in self.symbols:
                if symbol in market_states:
                    predictions = await self._get_enhanced_predictions_universal(
                        symbol, market_states[symbol], universal_stream
                    )
                    symbol_predictions[symbol] = predictions

            # Coordinate decisions considering symbol correlations
            for symbol in self.symbols:
                if symbol in symbol_predictions:
                    decision = await self._make_coordinated_decision(
                        symbol,
                        symbol_predictions[symbol],
                        symbol_predictions,
                        market_states[symbol]
                    )
                    decisions[symbol] = decision

                    # Queue for RL evaluation
                    if decision and decision.action != 'HOLD':
                        self._queue_for_rl_evaluation(decision, market_states[symbol])

        except Exception as e:
            logger.error(f"Error in coordinated decision making: {e}")

        return decisions
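
    # Driver sketch for the method above (illustrative; a production loop would
    # also handle cancellation and route decisions to a TradingExecutor):
    #
    #     async def run_decision_loop(orchestrator: 'EnhancedTradingOrchestrator'):
    #         while True:
    #             decisions = await orchestrator.make_coordinated_decisions()
    #             for symbol, decision in decisions.items():
    #                 if decision:
    #                     logger.info(f"{symbol}: {decision.action} @ {decision.price}")
    #             await asyncio.sleep(orchestrator.decision_frequency)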

    async def _get_all_market_states_universal(self, universal_stream: UniversalDataStream) -> Dict[str, MarketState]:
        """Get market states for all symbols with comprehensive data for RL"""
        market_states = {}

        for symbol in self.symbols:
            try:
                # Basic market state data
                current_prices = {}
                for timeframe in self.timeframes:
                    # Get latest price from universal data stream
                    latest_price = self._get_latest_price_from_universal(symbol, timeframe, universal_stream)
                    if latest_price:
                        current_prices[timeframe] = latest_price

                # Calculate basic metrics
                volatility = self._calculate_volatility_from_universal(symbol, universal_stream)
                volume = self._calculate_volume_from_universal(symbol, universal_stream)
                trend_strength = self._calculate_trend_strength_from_universal(symbol, universal_stream)
                market_regime = self._determine_market_regime(symbol, universal_stream)

                # Get comprehensive data for RL state building
                raw_ticks = self._get_recent_tick_data_for_rl(symbol)
                ohlcv_data = self._get_multiframe_ohlcv_for_rl(symbol)
                btc_reference_data = self._get_multiframe_ohlcv_for_rl('BTC/USDT')

                # Get CNN features if available
                cnn_hidden_features, cnn_predictions = self._get_cnn_features_for_rl(symbol)

                # Calculate pivot points
                pivot_points = self._calculate_pivot_points_for_rl(ohlcv_data)

                # Analyze market microstructure
                market_microstructure = self._analyze_market_microstructure(raw_ticks)

                # Create comprehensive market state
                market_state = MarketState(
                    symbol=symbol,
                    timestamp=datetime.now(),
                    prices=current_prices,
                    features={},  # Will be populated by feature extraction
                    volatility=volatility,
                    volume=volume,
                    trend_strength=trend_strength,
                    market_regime=market_regime,
                    universal_data=universal_stream,
                    raw_ticks=raw_ticks,
                    ohlcv_data=ohlcv_data,
                    btc_reference_data=btc_reference_data,
                    cnn_hidden_features=cnn_hidden_features,
                    cnn_predictions=cnn_predictions,
                    pivot_points=pivot_points,
                    market_microstructure=market_microstructure
                )

                market_states[symbol] = market_state
                logger.debug(f"Created comprehensive market state for {symbol} with {len(raw_ticks)} ticks")

            except Exception as e:
                logger.error(f"Error creating market state for {symbol}: {e}")

        return market_states

    def _get_recent_tick_data_for_rl(self, symbol: str, seconds: int = 300) -> List[Dict[str, Any]]:
        """Get recent tick data for RL state building"""
        try:
            # Get ticks from data provider
            recent_ticks = self.data_provider.get_recent_ticks(symbol, count=seconds * 10)

            # Convert to required format
            tick_data = []
            for tick in recent_ticks[-300:]:  # Last 300 ticks max (~300s at 1 tick/sec)
                tick_dict = {
                    'timestamp': tick.timestamp,
                    'price': tick.price,
                    'volume': tick.volume,
                    'quantity': getattr(tick, 'quantity', tick.volume),
                    'side': getattr(tick, 'side', 'unknown'),
                    'trade_id': getattr(tick, 'trade_id', 'unknown'),
                    'is_buyer_maker': getattr(tick, 'is_buyer_maker', False)
                }
                tick_data.append(tick_dict)

            return tick_data

        except Exception as e:
            logger.warning(f"Error getting tick data for {symbol}: {e}")
            return []

    def _get_multiframe_ohlcv_for_rl(self, symbol: str) -> Dict[str, List[Dict[str, Any]]]:
        """Get multi-timeframe OHLCV data for RL state building"""
        try:
            ohlcv_data = {}
            timeframes = ['1s', '1m', '1h', '1d']

            for tf in timeframes:
                try:
                    # Get historical data for timeframe
                    df = self.data_provider.get_historical_data(
                        symbol=symbol,
                        timeframe=tf,
                        limit=300,
                        refresh=True
                    )

                    if df is not None and not df.empty:
                        # Convert to list of dictionaries with technical indicators
                        bars = []

                        # Add technical indicators
                        df_with_indicators = self._add_technical_indicators(df)

                        for idx, row in df_with_indicators.tail(300).iterrows():
                            bar = {
                                'timestamp': idx if hasattr(idx, 'timestamp') else datetime.now(),
                                'open': float(row.get('open', 0)),
                                'high': float(row.get('high', 0)),
                                'low': float(row.get('low', 0)),
                                'close': float(row.get('close', 0)),
                                'volume': float(row.get('volume', 0)),
                                'rsi': float(row.get('rsi', 50)),
                                'macd': float(row.get('macd', 0)),
                                'bb_upper': float(row.get('bb_upper', row.get('close', 0))),
                                'bb_lower': float(row.get('bb_lower', row.get('close', 0))),
                                'sma_20': float(row.get('sma_20', row.get('close', 0))),
                                'ema_12': float(row.get('ema_12', row.get('close', 0))),
                                'atr': float(row.get('atr', 0))
                            }
                            bars.append(bar)

                        ohlcv_data[tf] = bars
                    else:
                        ohlcv_data[tf] = []

                except Exception as e:
                    logger.warning(f"Error getting {tf} data for {symbol}: {e}")
                    ohlcv_data[tf] = []

            return ohlcv_data

        except Exception as e:
            logger.warning(f"Error getting OHLCV data for {symbol}: {e}")
            return {}

    def _add_technical_indicators(self, df: pd.DataFrame) -> pd.DataFrame:
        """Add technical indicators to OHLCV data"""
        try:
            df = df.copy()

            # RSI
            if len(df) >= 14:
                df['rsi'] = ta.momentum.rsi(df['close'], window=14)
            else:
                df['rsi'] = 50

            # MACD
            if len(df) >= 26:
                df['macd'] = ta.trend.macd_diff(df['close'])
            else:
                df['macd'] = 0

            # Bollinger Bands
            if len(df) >= 20:
                bb = ta.volatility.BollingerBands(df['close'], window=20)
                df['bb_upper'] = bb.bollinger_hband()
                df['bb_lower'] = bb.bollinger_lband()
            else:
                df['bb_upper'] = df['close']
                df['bb_lower'] = df['close']

            # Moving Averages
            if len(df) >= 20:
                df['sma_20'] = ta.trend.sma_indicator(df['close'], window=20)
            else:
                df['sma_20'] = df['close']

            if len(df) >= 12:
                df['ema_12'] = ta.trend.ema_indicator(df['close'], window=12)
            else:
                df['ema_12'] = df['close']

            # ATR
            if len(df) >= 14:
                df['atr'] = ta.volatility.average_true_range(df['high'], df['low'], df['close'], window=14)
            else:
                df['atr'] = 0

            return df

        except Exception as e:
            logger.warning(f"Error adding technical indicators: {e}")
            return df

    def _get_cnn_features_for_rl(self, symbol: str) -> Tuple[Optional[Dict[str, np.ndarray]], Optional[Dict[str, np.ndarray]]]:
        """Get CNN hidden features and predictions for RL state building"""
        try:
            # Try to get CNN features from model registry
            if hasattr(self, 'model_registry') and self.model_registry:
                cnn_models = self.model_registry.get_models_by_type('cnn')

                if cnn_models:
                    hidden_features = {}
                    predictions = {}

                    for model_name, model in cnn_models.items():
                        try:
                            # Get recent market data for the model
                            feature_matrix = self.data_provider.get_feature_matrix(
                                symbol=symbol,
                                timeframes=['1s', '1m', '1h', '1d'],
                                window_size=50
                            )

                            if feature_matrix is not None:
                                # Extract hidden features and predictions
                                model_hidden, model_pred = self._extract_cnn_features(model, feature_matrix)
                                if model_hidden is not None:
                                    hidden_features[model_name] = model_hidden
                                if model_pred is not None:
                                    predictions[model_name] = model_pred

                        except Exception as e:
                            logger.warning(f"Error getting features from CNN model {model_name}: {e}")

                    return hidden_features if hidden_features else None, predictions if predictions else None

            return None, None

        except Exception as e:
            logger.warning(f"Error getting CNN features for {symbol}: {e}")
            return None, None

    def _extract_cnn_features(self, model, feature_matrix: np.ndarray) -> Tuple[Optional[np.ndarray], Optional[np.ndarray]]:
        """Extract hidden features and predictions from CNN model"""
        try:
            # Placeholder implementation: the extraction depends on the specific
            # CNN architecture, so random values stand in for real outputs here

            # Mock hidden features (would be extracted from the model's hidden layers)
            hidden_features = np.random.random(512).astype(np.float32)

            # Mock predictions (would be the model's output)
            predictions = np.array([0.33, 0.33, 0.34, 0.7]).astype(np.float32)  # BUY, SELL, HOLD, confidence

            return hidden_features, predictions

        except Exception as e:
            logger.warning(f"Error extracting CNN features: {e}")
            return None, None
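
    # Illustrative sketch of what a real implementation of the placeholder above
    # could look like (assumptions: the CNN is a torch.nn.Module and the name of
    # its penultimate layer is known; 'fc1' below is hypothetical):
    def _extract_cnn_features_torch_sketch(self, model, feature_matrix: np.ndarray,
                                           hidden_layer_name: str = 'fc1') -> Tuple[Optional[np.ndarray], Optional[np.ndarray]]:
        """Capture hidden activations via a forward hook, then run inference"""
        captured = {}

        def hook(_module, _inputs, output):
            # Store a flat copy of the penultimate-layer activations
            captured['hidden'] = output.detach().cpu().numpy().ravel()

        layer = dict(model.named_modules()).get(hidden_layer_name)
        if layer is None:
            return None, None
        handle = layer.register_forward_hook(hook)
        try:
            with torch.no_grad():
                x = torch.from_numpy(feature_matrix).float().unsqueeze(0)  # Add batch dim
                predictions = model(x).cpu().numpy().ravel()
        finally:
            handle.remove()  # Always detach the hook
        return captured.get('hidden'), predictions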

    def _calculate_pivot_points_for_rl(self, ohlcv_data: Dict[str, List]) -> Optional[Dict[str, Any]]:
        """Calculate Williams pivot points for RL state building"""
        try:
            if '1m' in ohlcv_data and len(ohlcv_data['1m']) >= 50:
                # Use 1m data for pivot calculation
                bars = ohlcv_data['1m']

                # Convert to numpy array
                ohlc_array = np.array([
                    [bar['timestamp'].timestamp() if hasattr(bar['timestamp'], 'timestamp') else time.time(),
                     bar['open'], bar['high'], bar['low'], bar['close'], bar['volume']]
                    for bar in bars[-200:]  # Last 200 bars
                ])

                # Calculate pivot points using Williams structure
                # Placeholder: this would use the WilliamsMarketStructure implementation
                pivot_data = {
                    'swing_highs': [],
                    'swing_lows': [],
                    'trend_levels': [],
                    'market_bias': 'neutral'
                }

                return pivot_data

            return None

        except Exception as e:
            logger.warning(f"Error calculating pivot points: {e}")
            return None
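
    # Minimal swing-point sketch (assumption: a bar is a swing high/low when it
    # is the extreme of its +/- `window` neighborhood; the real Williams market
    # structure logic lives in the WilliamsMarketStructure implementation):
    @staticmethod
    def _detect_swings_sketch(bars: List[Dict[str, Any]], window: int = 5) -> Dict[str, List[int]]:
        """Return indices of naive swing highs/lows in a list of OHLCV bars"""
        highs = [bar['high'] for bar in bars]
        lows = [bar['low'] for bar in bars]
        swing_highs, swing_lows = [], []
        for i in range(window, len(bars) - window):
            neighborhood = slice(i - window, i + window + 1)
            if highs[i] == max(highs[neighborhood]):
                swing_highs.append(i)
            if lows[i] == min(lows[neighborhood]):
                swing_lows.append(i)
        return {'swing_highs': swing_highs, 'swing_lows': swing_lows}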

    def _analyze_market_microstructure(self, raw_ticks: List[Dict[str, Any]]) -> Dict[str, Any]:
        """Analyze market microstructure from tick data"""
        try:
            if not raw_ticks or len(raw_ticks) < 10:
                return {}

            # Calculate microstructure metrics
            prices = [tick['price'] for tick in raw_ticks]
            volumes = [tick['volume'] for tick in raw_ticks]

            # Price momentum
            price_momentum = (prices[-1] - prices[0]) / prices[0] if prices[0] != 0 else 0

            # Volume pattern
            avg_volume = sum(volumes) / len(volumes)
            recent_volume = sum(volumes[-10:]) / 10 if len(volumes) >= 10 else avg_volume
            volume_intensity = recent_volume / avg_volume if avg_volume != 0 else 1.0

            # Tick frequency
            if len(raw_ticks) >= 2:
                time_diffs = []
                for i in range(1, len(raw_ticks)):
                    if hasattr(raw_ticks[i]['timestamp'], 'timestamp') and hasattr(raw_ticks[i-1]['timestamp'], 'timestamp'):
                        diff = raw_ticks[i]['timestamp'].timestamp() - raw_ticks[i-1]['timestamp'].timestamp()
                        time_diffs.append(diff)

                avg_tick_interval = sum(time_diffs) / len(time_diffs) if time_diffs else 1.0
            else:
                avg_tick_interval = 1.0

            return {
                'price_momentum': price_momentum,
                'volume_intensity': volume_intensity,
                'avg_tick_interval': avg_tick_interval,
                'tick_count': len(raw_ticks),
                'price_volatility': np.std(prices) if len(prices) > 1 else 0.0
            }

        except Exception as e:
            logger.warning(f"Error analyzing market microstructure: {e}")
            return {}
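
    # Worked example for the metrics above: ticks moving 3000.0 -> 3030.0 give
    # price_momentum = (3030 - 3000) / 3000 = 0.01 (+1%); if the last 10 ticks
    # average twice the overall mean volume, volume_intensity = 2.0.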

    async def _get_enhanced_predictions_universal(self, symbol: str, market_state: MarketState,
                                                  universal_stream: UniversalDataStream) -> List[EnhancedPrediction]:
        """Get enhanced predictions using universal data format"""
        predictions = []

        for model_name, model in self.model_registry.models.items():
            try:
                if isinstance(model, CNNModelInterface):
                    # Format universal data for CNN model
                    cnn_data = self.universal_adapter.format_for_model(universal_stream, 'cnn')

                    # Get CNN predictions for each timeframe using universal data
                    timeframe_predictions = []

                    # ETH timeframes (primary trading pair)
                    if symbol == 'ETH/USDT':
                        timeframe_data_map = {
                            '1s': cnn_data.get('eth_ticks'),
                            '1m': cnn_data.get('eth_1m'),
                            '1h': cnn_data.get('eth_1h'),
                            '1d': cnn_data.get('eth_1d')
                        }
                    # BTC reference
                    elif symbol == 'BTC/USDT':
                        timeframe_data_map = {
                            '1s': cnn_data.get('btc_ticks')
                        }
                    else:
                        continue

                    for timeframe, feature_matrix in timeframe_data_map.items():
                        if feature_matrix is not None and len(feature_matrix) > 0:
                            # Get timeframe-specific prediction using universal data
                            action_probs, confidence = await self._get_timeframe_prediction_universal(
                                model, feature_matrix, timeframe, market_state, universal_stream
                            )

                            if action_probs is not None:
                                action_names = ['SELL', 'HOLD', 'BUY']
                                best_action_idx = np.argmax(action_probs)
                                best_action = action_names[best_action_idx]

                                # Create timeframe prediction
                                tf_prediction = TimeframePrediction(
                                    timeframe=timeframe,
                                    action=best_action,
                                    confidence=float(confidence),
                                    probabilities={name: float(prob) for name, prob in zip(action_names, action_probs)},
                                    timestamp=datetime.now(),
                                    market_features={
                                        'volatility': market_state.volatility,
                                        'volume': market_state.volume,
                                        'trend_strength': market_state.trend_strength,
                                        'data_quality': universal_stream.metadata['data_quality']['overall_score']
                                    }
                                )
                                timeframe_predictions.append(tf_prediction)

                    if timeframe_predictions:
                        # Combine timeframe predictions into overall prediction
                        overall_action, overall_confidence = self._combine_timeframe_predictions(
                            timeframe_predictions, symbol
                        )

                        enhanced_pred = EnhancedPrediction(
                            symbol=symbol,
                            timeframe_predictions=timeframe_predictions,
                            overall_action=overall_action,
                            overall_confidence=overall_confidence,
                            model_name=model.name,
                            timestamp=datetime.now(),
                            metadata={
                                'market_regime': market_state.market_regime,
                                'symbol_correlation': self._get_symbol_correlation(symbol),
                                'universal_data_quality': universal_stream.metadata['data_quality'],
                                'data_freshness': universal_stream.metadata['data_freshness']
                            }
                        )
                        predictions.append(enhanced_pred)

            except Exception as e:
                logger.error(f"Error getting enhanced predictions from {model_name}: {e}")

        return predictions

    async def _get_timeframe_prediction_universal(self, model: CNNModelInterface, feature_matrix: np.ndarray,
                                                  timeframe: str, market_state: MarketState,
                                                  universal_stream: UniversalDataStream) -> Tuple[Optional[np.ndarray], float]:
        """Get prediction for specific timeframe using universal data format with CNN monitoring"""
        try:
            # Measure prediction timing
            prediction_start_time = time.time()

            # Get current price for context
            current_price = market_state.prices.get(timeframe)

            # Dispatch in priority order: timeframe-specific, enhanced, then standard
            prediction_result = None  # Only populated by the dict-returning paths below
            if hasattr(model, 'predict_timeframe'):
                action_probs, confidence = model.predict_timeframe(feature_matrix, timeframe)
            elif hasattr(model, 'enhanced_predict'):
                # Enhanced CNN model with detailed output
                prediction_result = model.enhanced_predict(feature_matrix)
                action_probs = prediction_result.get('probabilities', [])
                confidence = prediction_result.get('confidence', 0.0)
            else:
                # Standard prediction (may return a dict or an (action_probs, confidence) tuple)
                prediction_result = model.predict(feature_matrix)
                if isinstance(prediction_result, dict):
                    action_probs = prediction_result.get('probabilities', [])
                    confidence = prediction_result.get('confidence', 0.0)
                else:
                    action_probs, confidence = prediction_result
                    prediction_result = None

            # Calculate prediction latency
            prediction_latency_ms = (time.time() - prediction_start_time) * 1000

            if action_probs is not None and confidence is not None:
                # Enhance confidence based on universal data quality and market conditions
                enhanced_confidence = self._enhance_confidence_with_universal_context(
                    confidence, timeframe, market_state, universal_stream
                )

                # Log detailed CNN prediction for monitoring
                try:
                    # Convert probabilities to list if needed
                    if hasattr(action_probs, 'tolist'):
                        prob_list = action_probs.tolist()
                    elif isinstance(action_probs, (list, tuple)):
                        prob_list = list(action_probs)
                    else:
                        prob_list = [float(action_probs)]

                    # Determine action and action confidence
                    if len(prob_list) >= 2:
                        action_idx = np.argmax(prob_list)
                        action_name = ['SELL', 'BUY'][action_idx] if len(prob_list) == 2 else ['SELL', 'HOLD', 'BUY'][action_idx]
                        action_confidence = prob_list[action_idx]
                    else:
                        action_idx = 0
                        action_name = 'HOLD'
                        action_confidence = enhanced_confidence

                    # Get model memory usage if available
                    model_memory_mb = None
                    if hasattr(model, 'get_memory_usage'):
                        try:
                            memory_info = model.get_memory_usage()
                            if isinstance(memory_info, dict):
                                model_memory_mb = memory_info.get('total_size_mb', 0.0)
                            else:
                                model_memory_mb = float(memory_info)
                        except Exception:
                            pass

                    # Create detailed prediction result for monitoring
                    detailed_prediction = {
                        'action': action_idx,
                        'action_name': action_name,
                        'confidence': float(enhanced_confidence),
                        'action_confidence': float(action_confidence),
                        'probabilities': prob_list,
                        'raw_logits': prob_list  # Use probabilities as proxy for logits if not available
                    }

                    # Add enhanced model outputs if available
                    if isinstance(prediction_result, dict):
                        detailed_prediction.update({
                            'regime_probabilities': prediction_result.get('regime_probabilities'),
                            'volatility_prediction': prediction_result.get('volatility_prediction'),
                            'extrema_prediction': prediction_result.get('extrema_prediction'),
                            'risk_assessment': prediction_result.get('risk_assessment')
                        })

                    # Calculate price changes for context
                    price_change_1m = None
                    price_change_5m = None
                    volume_ratio = None

                    if current_price and timeframe in market_state.prices:
                        # Use the per-timeframe price snapshots as a rough proxy for historical context
                        try:
                            # Get 1m and 5m price changes if available
                            if '1m' in market_state.prices and market_state.prices['1m'] != current_price:
                                price_change_1m = (current_price - market_state.prices['1m']) / market_state.prices['1m']
                            if '5m' in market_state.prices and market_state.prices['5m'] != current_price:
                                price_change_5m = (current_price - market_state.prices['5m']) / market_state.prices['5m']

                            # Volume ratio (current vs average)
                            volume_ratio = market_state.volume
                        except Exception:
                            pass

                    # Log the CNN prediction with full context
                    log_cnn_prediction(
                        model_name=getattr(model, 'name', model.__class__.__name__),
                        symbol=market_state.symbol,
                        prediction_result=detailed_prediction,
                        feature_matrix_shape=feature_matrix.shape,
                        current_price=current_price,
                        prediction_latency_ms=prediction_latency_ms,
                        model_memory_usage_mb=model_memory_mb
                    )

                    # Enhanced logging for detailed analysis
                    logger.info(f"CNN [{getattr(model, 'name', 'Unknown')}] {market_state.symbol} {timeframe}: "
                                f"{action_name} (conf: {enhanced_confidence:.3f}, "
                                f"action_conf: {action_confidence:.3f}, "
                                f"latency: {prediction_latency_ms:.1f}ms)")

                    if detailed_prediction.get('regime_probabilities'):
                        regime_idx = np.argmax(detailed_prediction['regime_probabilities'])
                        regime_conf = detailed_prediction['regime_probabilities'][regime_idx]
                        logger.info(f"  Regime: {regime_idx} (conf: {regime_conf:.3f})")

                    if detailed_prediction.get('volatility_prediction') is not None:
                        logger.info(f"  Volatility: {detailed_prediction['volatility_prediction']:.3f}")

                    if price_change_1m is not None and volume_ratio is not None:
                        logger.info(f"  Context: 1m_change: {price_change_1m:.4f}, volume_ratio: {volume_ratio:.2f}")

                except Exception as e:
                    logger.warning(f"Error logging CNN prediction details: {e}")

                return action_probs, enhanced_confidence

        except Exception as e:
            logger.error(f"Error getting timeframe prediction for {timeframe}: {e}")

        return None, 0.0

    def _enhance_confidence_with_universal_context(self, base_confidence: float, timeframe: str,
                                                   market_state: MarketState,
                                                   universal_stream: UniversalDataStream) -> float:
        """Enhance confidence score based on universal data context"""
        enhanced = base_confidence

        # Adjust based on data quality from universal stream
        data_quality = universal_stream.metadata['data_quality']['overall_score']
        enhanced *= data_quality

        # Adjust based on data freshness
        freshness = universal_stream.metadata.get('data_freshness', {})
        if timeframe in ['1s', '1m']:
            # For short timeframes, penalize stale data more heavily
            eth_freshness = freshness.get(f'eth_{timeframe}', 0)
            if eth_freshness > 60:  # More than 1 minute old
                enhanced *= 0.8

        # Adjust based on market regime
        if market_state.market_regime == 'trending':
            enhanced *= 1.1  # More confident in trending markets
        elif market_state.market_regime == 'volatile':
            enhanced *= 0.8  # Less confident in volatile markets

        # Adjust based on timeframe reliability for scalping
        timeframe_reliability = {
            '1s': 1.0,   # Primary scalping timeframe
            '1m': 0.9,   # Short-term confirmation
            '5m': 0.8,   # Short-term momentum
            '15m': 0.9,  # Entry/exit timing
            '1h': 0.8,   # Medium-term trend
            '4h': 0.7,   # Longer-term (less relevant for scalping)
            '1d': 0.6    # Long-term direction (minimal for scalping)
        }
        enhanced *= timeframe_reliability.get(timeframe, 1.0)

        # Adjust based on volume
        if market_state.volume > 1.5:  # High volume
            enhanced *= 1.05
        elif market_state.volume < 0.5:  # Low volume
            enhanced *= 0.9

        # Adjust based on correlation with BTC (for ETH trades)
        if market_state.symbol == 'ETH/USDT' and len(universal_stream.btc_ticks) > 1:
            # Check ETH-BTC correlation strength
            eth_momentum = (universal_stream.eth_ticks[-1, 4] - universal_stream.eth_ticks[-2, 4]) / universal_stream.eth_ticks[-2, 4]
            btc_momentum = (universal_stream.btc_ticks[-1, 4] - universal_stream.btc_ticks[-2, 4]) / universal_stream.btc_ticks[-2, 4]

            # If ETH and BTC are moving in the same direction, increase confidence
            if (eth_momentum > 0 and btc_momentum > 0) or (eth_momentum < 0 and btc_momentum < 0):
                enhanced *= 1.05
            else:
                enhanced *= 0.95

        return min(enhanced, 1.0)  # Cap at 1.0
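
    # Worked example of the adjustments above: a base confidence of 0.70 with
    # data quality 0.95, a trending regime (x1.1), the 1m reliability factor
    # (x0.9) and high volume (x1.05) yields 0.70 * 0.95 * 1.1 * 0.9 * 1.05 ~= 0.69.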

    def _combine_timeframe_predictions(self, timeframe_predictions: List[TimeframePrediction],
                                       symbol: str) -> Tuple[str, float]:
        """Combine predictions from multiple timeframes"""
        action_scores = {'BUY': 0.0, 'SELL': 0.0, 'HOLD': 0.0}
        total_weight = 0.0

        for tf_pred in timeframe_predictions:
            # Get timeframe weight
            tf_weight = self.timeframe_weights.get(tf_pred.timeframe, 0.1)

            # Weight by confidence and timeframe importance
            weighted_confidence = tf_pred.confidence * tf_weight

            # Add to action scores
            action_scores[tf_pred.action] += weighted_confidence
            total_weight += weighted_confidence

        # Normalize scores
        if total_weight > 0:
            for action in action_scores:
                action_scores[action] /= total_weight

        # Get best action and confidence
        best_action = max(action_scores, key=action_scores.get)
        best_confidence = action_scores[best_action]

        return best_action, best_confidence
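
    # Worked example of the weighted vote above: with weights {'1s': 0.6,
    # '1m': 0.2} and predictions BUY @ 0.8 on 1s and SELL @ 0.5 on 1m, the raw
    # scores are BUY = 0.48 and SELL = 0.10; after normalizing by the total
    # weight 0.58, the result is BUY with confidence ~0.83.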

    async def _make_coordinated_decision(self, symbol: str, predictions: List[EnhancedPrediction],
                                         all_predictions: Dict[str, List[EnhancedPrediction]],
                                         market_state: MarketState) -> Optional[TradingAction]:
        """Make decision using streamlined 2-action system with position intelligence"""
        if not predictions:
            return None

        try:
            # Use the 2-action decision making
            decision = self._make_2_action_decision(symbol, predictions, market_state)

            if decision:
                # Store recent action for tracking
                self.recent_actions[symbol].append(decision)

                logger.info(f"[SUCCESS] Coordinated decision for {symbol}: {decision.action} "
                            f"(confidence: {decision.confidence:.3f}, "
                            f"reasoning: {decision.reasoning.get('action_type', 'UNKNOWN')})")

                return decision
            else:
                logger.debug(f"No decision made for {symbol} - insufficient confidence or position conflict")
                return None

        except Exception as e:
            logger.error(f"Error making coordinated decision for {symbol}: {e}")
            return None

    def _is_closing_action(self, symbol: str, action: str) -> bool:
        """Determine if an action would close an existing position"""
        if symbol not in self.current_positions:
            return False

        current_position = self.current_positions[symbol]

        # Closing logic: the opposite action closes the position
        if current_position['side'] == 'LONG' and action == 'SELL':
            return True
        elif current_position['side'] == 'SHORT' and action == 'BUY':
            return True

        return False

    def _update_position_tracking(self, symbol: str, action: TradingAction):
        """Update internal position tracking for threshold logic"""
        if action.action == 'BUY':
            # If currently SHORT, close it; otherwise open a LONG
            if symbol in self.current_positions and self.current_positions[symbol]['side'] == 'SHORT':
                self._close_trade_for_sensitivity_learning(symbol, action)
                del self.current_positions[symbol]
            else:
                self._open_trade_for_sensitivity_learning(symbol, action)
                self.current_positions[symbol] = {
                    'side': 'LONG',
                    'entry_price': action.price,
                    'timestamp': action.timestamp
                }
        elif action.action == 'SELL':
            # If currently LONG, close it; otherwise open a SHORT
            if symbol in self.current_positions and self.current_positions[symbol]['side'] == 'LONG':
                self._close_trade_for_sensitivity_learning(symbol, action)
                del self.current_positions[symbol]
            else:
                self._open_trade_for_sensitivity_learning(symbol, action)
                self.current_positions[symbol] = {
                    'side': 'SHORT',
                    'entry_price': action.price,
                    'timestamp': action.timestamp
                }

    def _open_trade_for_sensitivity_learning(self, symbol: str, action: TradingAction):
        """Track trade opening for sensitivity learning"""
        try:
            # Get current market state for learning context
            market_state = self._get_current_market_state_for_sensitivity(symbol)

            trade_info = {
                'symbol': symbol,
                'side': 'LONG' if action.action == 'BUY' else 'SHORT',
                'entry_price': action.price,
                'entry_time': action.timestamp,
                'entry_confidence': action.confidence,
                'entry_market_state': market_state,
                'sensitivity_level_at_entry': self.current_sensitivity_level,
                'thresholds_used': {
                    'open': self._get_current_open_threshold(),
                    'close': self._get_current_close_threshold()
                }
            }

            self.active_trades[symbol] = trade_info
            logger.info(f"Opened trade for sensitivity learning: {symbol} {trade_info['side']} @ ${action.price:.2f}")

        except Exception as e:
            logger.error(f"Error tracking trade opening for sensitivity learning: {e}")

    def _close_trade_for_sensitivity_learning(self, symbol: str, action: TradingAction):
        """Track trade closing and create learning case for DQN"""
        try:
            if symbol not in self.active_trades:
                return

            trade_info = self.active_trades[symbol]

            # Calculate trade outcome
            entry_price = trade_info['entry_price']
            exit_price = action.price
            side = trade_info['side']

            if side == 'LONG':
                pnl_pct = (exit_price - entry_price) / entry_price
            else:  # SHORT
                pnl_pct = (entry_price - exit_price) / entry_price

            # Calculate trade duration
            duration = (action.timestamp - trade_info['entry_time']).total_seconds()

            # Get current market state for exit context
            exit_market_state = self._get_current_market_state_for_sensitivity(symbol)

            # Create completed trade record
            completed_trade = {
                'symbol': symbol,
                'side': side,
                'entry_price': entry_price,
                'exit_price': exit_price,
                'entry_time': trade_info['entry_time'],
                'exit_time': action.timestamp,
                'duration': duration,
                'pnl_pct': pnl_pct,
                'entry_confidence': trade_info['entry_confidence'],
                'exit_confidence': action.confidence,
                'entry_market_state': trade_info['entry_market_state'],
                'exit_market_state': exit_market_state,
                'sensitivity_level_used': trade_info['sensitivity_level_at_entry'],
                'thresholds_used': trade_info['thresholds_used']
            }

            self.completed_trades.append(completed_trade)

            # Create sensitivity learning case for DQN
            self._create_sensitivity_learning_case(completed_trade)

            # Remove from active trades
            del self.active_trades[symbol]

            logger.info(f"Closed trade for sensitivity learning: {symbol} {side} P&L: {pnl_pct*100:+.2f}% Duration: {duration:.0f}s")

        except Exception as e:
            logger.error(f"Error tracking trade closing for sensitivity learning: {e}")

    def _get_current_market_state_for_sensitivity(self, symbol: str) -> Dict[str, float]:
        """Get current market state features for sensitivity learning"""
        try:
            # Get recent price data
            recent_data = self.data_provider.get_historical_data(symbol, '1m', limit=20)

            if recent_data is None or len(recent_data) < 10:
                return self._get_default_market_state()

            # Calculate market features
            current_price = recent_data['close'].iloc[-1]

            # Volatility (20-period)
            volatility = recent_data['close'].pct_change().std() * 100

            # Price momentum (5-period)
            momentum_5 = (current_price - recent_data['close'].iloc[-6]) / recent_data['close'].iloc[-6] * 100

            # Volume ratio
            avg_volume = recent_data['volume'].mean()
            current_volume = recent_data['volume'].iloc[-1]
            volume_ratio = current_volume / avg_volume if avg_volume > 0 else 1.0

            # RSI
            rsi = recent_data['rsi'].iloc[-1] if 'rsi' in recent_data.columns else 50.0

            # MACD signal
            macd_signal = 0.0
            if 'macd' in recent_data.columns and 'macd_signal' in recent_data.columns:
                macd_signal = recent_data['macd'].iloc[-1] - recent_data['macd_signal'].iloc[-1]

            # Bollinger Band position
            bb_position = 0.5  # Default to the middle of the bands
            if 'bb_upper' in recent_data.columns and 'bb_lower' in recent_data.columns:
                bb_upper = recent_data['bb_upper'].iloc[-1]
                bb_lower = recent_data['bb_lower'].iloc[-1]
                if bb_upper > bb_lower:
                    bb_position = (current_price - bb_lower) / (bb_upper - bb_lower)

            # Recent price change patterns
            price_changes = recent_data['close'].pct_change().tail(5).tolist()

            return {
                'volatility': volatility,
                'momentum_5': momentum_5,
                'volume_ratio': volume_ratio,
                'rsi': rsi,
                'macd_signal': macd_signal,
                'bb_position': bb_position,
                'price_change_1': price_changes[-1] if len(price_changes) > 0 else 0.0,
                'price_change_2': price_changes[-2] if len(price_changes) > 1 else 0.0,
                'price_change_3': price_changes[-3] if len(price_changes) > 2 else 0.0,
                'price_change_4': price_changes[-4] if len(price_changes) > 3 else 0.0,
                'price_change_5': price_changes[-5] if len(price_changes) > 4 else 0.0
            }

        except Exception as e:
            logger.error(f"Error getting market state for sensitivity learning: {e}")
            return self._get_default_market_state()

    def _get_default_market_state(self) -> Dict[str, float]:
        """Get default market state when data is unavailable"""
        return {
            'volatility': 2.0,
            'momentum_5': 0.0,
            'volume_ratio': 1.0,
            'rsi': 50.0,
            'macd_signal': 0.0,
            'bb_position': 0.5,
            'price_change_1': 0.0,
            'price_change_2': 0.0,
            'price_change_3': 0.0,
            'price_change_4': 0.0,
            'price_change_5': 0.0
        }

    def _create_sensitivity_learning_case(self, completed_trade: Dict[str, Any]):
        """Create a learning case for the DQN sensitivity agent"""
        try:
            # Create state vector from market conditions at entry
            entry_state = self._market_state_to_sensitivity_state(
                completed_trade['entry_market_state'],
                completed_trade['sensitivity_level_used']
            )

            # Create state vector from market conditions at exit
            exit_state = self._market_state_to_sensitivity_state(
                completed_trade['exit_market_state'],
                completed_trade['sensitivity_level_used']
            )

            # Calculate reward based on trade outcome
            reward = self._calculate_sensitivity_reward(completed_trade)

            # Determine optimal sensitivity action based on outcome
            optimal_sensitivity = self._determine_optimal_sensitivity(completed_trade)

            # Create learning experience
            learning_case = {
                'state': entry_state,
                'action': completed_trade['sensitivity_level_used'],
                'reward': reward,
                'next_state': exit_state,
                'done': True,  # Trade is completed
                'optimal_action': optimal_sensitivity,
                'trade_outcome': completed_trade['pnl_pct'],
                'trade_duration': completed_trade['duration'],
                'symbol': completed_trade['symbol']
            }

            self.sensitivity_learning_queue.append(learning_case)

            # Train DQN if we have enough cases
            if len(self.sensitivity_learning_queue) >= 32:  # Batch size
                self._train_sensitivity_dqn()

            logger.info(f"Created sensitivity learning case: reward={reward:.3f}, optimal_sensitivity={optimal_sensitivity}")

        except Exception as e:
            logger.error(f"Error creating sensitivity learning case: {e}")

    def _market_state_to_sensitivity_state(self, market_state: Dict[str, float], current_sensitivity: int) -> np.ndarray:
        """Convert market state to DQN state vector for sensitivity learning"""
        try:
            # Create state vector with market features + current sensitivity
            state_features = [
                market_state.get('volatility', 2.0) / 10.0,   # Normalize volatility
                market_state.get('momentum_5', 0.0) / 5.0,    # Normalize momentum
                market_state.get('volume_ratio', 1.0),        # Volume ratio
                market_state.get('rsi', 50.0) / 100.0,        # Normalize RSI
                market_state.get('macd_signal', 0.0) / 2.0,   # Normalize MACD
                market_state.get('bb_position', 0.5),         # BB position (already 0-1)
                market_state.get('price_change_1', 0.0) * 100,  # Recent price changes
                market_state.get('price_change_2', 0.0) * 100,
                market_state.get('price_change_3', 0.0) * 100,
                market_state.get('price_change_4', 0.0) * 100,
                market_state.get('price_change_5', 0.0) * 100,
                current_sensitivity / 4.0,  # Normalize current sensitivity (0-4 -> 0-1)
            ]

            # Add recent performance metrics
            if len(self.completed_trades) > 0:
                recent_trades = list(self.completed_trades)[-10:]  # Last 10 trades
                avg_pnl = np.mean([t['pnl_pct'] for t in recent_trades])
                win_rate = len([t for t in recent_trades if t['pnl_pct'] > 0]) / len(recent_trades)
                avg_duration = np.mean([t['duration'] for t in recent_trades]) / 3600  # Normalize to hours
            else:
                avg_pnl = 0.0
                win_rate = 0.5
                avg_duration = 0.5

            state_features.extend([
                avg_pnl * 10,  # Recent average P&L
                win_rate,      # Recent win rate
                avg_duration,  # Recent average duration
            ])

            # Pad or truncate to the exact state size
            while len(state_features) < self.sensitivity_state_size:
                state_features.append(0.0)

            state_features = state_features[:self.sensitivity_state_size]

            return np.array(state_features, dtype=np.float32)

        except Exception as e:
            logger.error(f"Error converting market state to sensitivity state: {e}")
            return np.zeros(self.sensitivity_state_size, dtype=np.float32)

    def _calculate_sensitivity_reward(self, completed_trade: Dict[str, Any]) -> float:
        """Calculate reward for sensitivity learning based on trade outcome"""
        try:
            pnl_pct = completed_trade['pnl_pct']
            duration = completed_trade['duration']

            # Base reward from P&L
            base_reward = pnl_pct * 10  # Scale P&L percentage

            # Duration penalty/bonus
            if duration < 300:  # Less than 5 minutes - too quick
                duration_factor = 0.8
            elif duration < 1800:  # Less than 30 minutes - good for scalping
                duration_factor = 1.2
            elif duration < 3600:  # Less than 1 hour - acceptable
                duration_factor = 1.0
            else:  # More than 1 hour - too slow for scalping
                duration_factor = 0.7

            # Confidence factor - reward appropriate confidence levels
            entry_conf = completed_trade['entry_confidence']
            exit_conf = completed_trade['exit_confidence']

            if pnl_pct > 0:  # Winning trade
                # Reward high entry confidence and appropriate exit confidence
                conf_factor = (entry_conf + exit_conf) / 2
            else:  # Losing trade
                # Reward quick exit (high exit confidence for losses)
                conf_factor = exit_conf

            # Calculate final reward
            final_reward = base_reward * duration_factor * conf_factor

            # Clip reward to a reasonable range
            final_reward = np.clip(final_reward, -2.0, 2.0)

            return float(final_reward)

        except Exception as e:
            logger.error(f"Error calculating sensitivity reward: {e}")
            return 0.0
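
    # Worked example of the reward above: a +1.5% win closed in 20 minutes with
    # entry/exit confidences 0.7/0.6 gives base_reward = 0.15, duration_factor
    # = 1.2 (< 30 min) and conf_factor = 0.65, so the final reward is
    # 0.15 * 1.2 * 0.65 ~= 0.117 (well inside the [-2, 2] clip range).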

    def _determine_optimal_sensitivity(self, completed_trade: Dict[str, Any]) -> int:
        """Determine optimal sensitivity level based on trade outcome"""
        try:
            pnl_pct = completed_trade['pnl_pct']
            duration = completed_trade['duration']
            current_sensitivity = completed_trade['sensitivity_level_used']

            # If the trade was profitable and quick, the current sensitivity was good
            if pnl_pct > 0.01 and duration < 1800:  # >1% profit in <30 min
                return current_sensitivity

            # If the trade was very profitable, could have been more aggressive
            if pnl_pct > 0.02:  # >2% profit
                return min(4, current_sensitivity + 1)  # Increase sensitivity

            # If the trade was a small loss, might need more sensitivity
            if -0.01 < pnl_pct < 0:  # Small loss
                return min(4, current_sensitivity + 1)  # Increase sensitivity

            # If the trade was a big loss, need less sensitivity
            if pnl_pct < -0.02:  # >2% loss
                return max(0, current_sensitivity - 1)  # Decrease sensitivity

            # If the trade took too long, need more sensitivity
            if duration > 3600:  # >1 hour
                return min(4, current_sensitivity + 1)  # Increase sensitivity

            # Default: keep current sensitivity
            return current_sensitivity

        except Exception as e:
            logger.error(f"Error determining optimal sensitivity: {e}")
            return 2  # Default to medium

    def _train_sensitivity_dqn(self):
        """Train the DQN agent for sensitivity learning"""
        try:
            # Initialize the DQN agent lazily
            if self.sensitivity_dqn_agent is None:
                self._initialize_sensitivity_dqn()

            if self.sensitivity_dqn_agent is None:
                return

            # Get batch of learning cases
            batch_size = min(32, len(self.sensitivity_learning_queue))
            if batch_size < 8:  # Need a minimum batch size
                return

            # Sample a random batch
            batch_indices = np.random.choice(len(self.sensitivity_learning_queue), batch_size, replace=False)
            batch = [self.sensitivity_learning_queue[i] for i in batch_indices]

            # Feed the sampled experiences to the DQN agent
            for case in batch:
                self.sensitivity_dqn_agent.remember(
                    state=case['state'],
                    action=case['action'],
                    reward=case['reward'],
                    next_state=case['next_state'],
                    done=case['done']
                )

            # Perform replay training
            loss = self.sensitivity_dqn_agent.replay()

            if loss is not None:
                logger.info(f"Sensitivity DQN training completed. Loss: {loss:.4f}")

                # Update current sensitivity level based on recent performance
                self._update_current_sensitivity_level()

        except Exception as e:
            logger.error(f"Error training sensitivity DQN: {e}")

    def _initialize_sensitivity_dqn(self):
        """Initialize the DQN agent for sensitivity learning"""
        try:
            # Try to import the DQN agent
            from NN.models.dqn_agent import DQNAgent

            # Create DQN agent for sensitivity learning
            self.sensitivity_dqn_agent = DQNAgent(
                state_shape=(self.sensitivity_state_size,),
                n_actions=self.sensitivity_action_space,
                learning_rate=0.001,
                gamma=0.95,
                epsilon=0.3,  # Lower epsilon for more exploitation
                epsilon_min=0.05,
                epsilon_decay=0.995,
                buffer_size=1000,
                batch_size=32,
                target_update=10
            )

            logger.info("Sensitivity DQN agent initialized successfully")

        except Exception as e:
            logger.error(f"Error initializing sensitivity DQN agent: {e}")
            self.sensitivity_dqn_agent = None

def _update_current_sensitivity_level(self):
|
|
"""Update current sensitivity level using trained DQN"""
|
|
try:
|
|
if self.sensitivity_dqn_agent is None:
|
|
return
|
|
|
|
# Get current market state
|
|
current_market_state = self._get_current_market_state_for_sensitivity('ETH/USDT') # Use ETH as primary
|
|
current_state = self._market_state_to_sensitivity_state(current_market_state, self.current_sensitivity_level)
|
|
|
|
# Get action from DQN (without exploration for production use)
|
|
action = self.sensitivity_dqn_agent.act(current_state, explore=False)
|
|
|
|
# Update sensitivity level if it changed
|
|
if action != self.current_sensitivity_level:
|
|
old_level = self.current_sensitivity_level
|
|
self.current_sensitivity_level = action
|
|
|
|
# Update thresholds based on new sensitivity level
|
|
self._update_thresholds_from_sensitivity()
|
|
|
|
logger.info(f"Sensitivity level updated: {self.sensitivity_levels[old_level]['name']} -> {self.sensitivity_levels[action]['name']}")
|
|
|
|
except Exception as e:
|
|
logger.error(f"Error updating current sensitivity level: {e}")
|
|
|
|
    def _update_thresholds_from_sensitivity(self):
        """Update confidence thresholds based on current sensitivity level"""
        try:
            sensitivity_config = self.sensitivity_levels[self.current_sensitivity_level]

            # Get base thresholds from config
            base_open_threshold = self.config.orchestrator.get('confidence_threshold', 0.6)
            base_close_threshold = self.config.orchestrator.get('confidence_threshold_close', 0.25)

            # Apply sensitivity multipliers
            self.confidence_threshold_open = base_open_threshold * sensitivity_config['open_threshold_multiplier']
            self.confidence_threshold_close = base_close_threshold * sensitivity_config['close_threshold_multiplier']

            # Ensure thresholds stay within reasonable bounds
            self.confidence_threshold_open = np.clip(self.confidence_threshold_open, 0.3, 0.9)
            self.confidence_threshold_close = np.clip(self.confidence_threshold_close, 0.1, 0.6)

            logger.info(f"Updated thresholds - Open: {self.confidence_threshold_open:.3f}, Close: {self.confidence_threshold_close:.3f}")

        except Exception as e:
            logger.error(f"Error updating thresholds from sensitivity: {e}")

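    # Worked example of the threshold arithmetic above (the multipliers are
    # hypothetical; real values come from the sensitivity_levels config):
    #
    #   base_open = 0.60, open_threshold_multiplier = 0.8
    #       -> 0.60 * 0.8 = 0.48, clipped to [0.3, 0.9] -> 0.48
    #   base_close = 0.25, close_threshold_multiplier = 1.2
    #       -> 0.25 * 1.2 = 0.30, clipped to [0.1, 0.6] -> 0.30
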
    def _get_current_open_threshold(self) -> float:
        """Get current opening threshold"""
        return self.confidence_threshold_open

    def _get_current_close_threshold(self) -> float:
        """Get current closing threshold"""
        return self.confidence_threshold_close

    def _initialize_context_data(self):
        """Initialize 200-candle 1m context data for all symbols"""
        try:
            logger.info("Initializing 200-candle 1m context data for enhanced model performance")

            for symbol in self.symbols:
                try:
                    # Load 200 candles of 1m data
                    context_data = self.data_provider.get_historical_data(symbol, '1m', limit=200)

                    if context_data is not None and len(context_data) > 0:
                        # Store raw data
                        for _, row in context_data.iterrows():
                            candle_data = {
                                'timestamp': row['timestamp'],
                                'open': row['open'],
                                'high': row['high'],
                                'low': row['low'],
                                'close': row['close'],
                                'volume': row['volume']
                            }
                            self.context_data_1m[symbol].append(candle_data)

                        # Create feature matrix for models
                        self.context_features_1m[symbol] = self._create_context_features(context_data)

                        logger.info(f"Loaded {len(context_data)} 1m candles for {symbol} context")
                    else:
                        logger.warning(f"No 1m context data available for {symbol}")

                except Exception as e:
                    logger.error(f"Error loading context data for {symbol}: {e}")

        except Exception as e:
            logger.error(f"Error initializing context data: {e}")

    def _create_context_features(self, df: pd.DataFrame) -> Optional[np.ndarray]:
        """Create feature matrix from 1m context data for model consumption"""
        try:
            if df is None or len(df) < 50:
                return None

            # Select key features for context
            feature_columns = ['open', 'high', 'low', 'close', 'volume']

            # Add technical indicators if available
            if 'rsi_14' in df.columns:
                feature_columns.extend(['rsi_14', 'sma_20', 'ema_12'])
            if 'macd' in df.columns:
                feature_columns.extend(['macd', 'macd_signal'])
            if 'bb_upper' in df.columns:
                feature_columns.extend(['bb_upper', 'bb_lower', 'bb_percent'])

            # Extract available features
            available_features = [col for col in feature_columns if col in df.columns]
            feature_data = df[available_features].copy()

            # Normalize features
            normalized_features = self._normalize_context_features(feature_data)

            return normalized_features.values if normalized_features is not None else None

        except Exception as e:
            logger.error(f"Error creating context features: {e}")
            return None

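    # Resulting shape note: with 200 candles and only OHLCV present the matrix
    # is (200, 5); each indicator group found in the DataFrame widens it
    # (rsi_14/sma_20/ema_12 -> +3 columns, macd/macd_signal -> +2,
    # bb_upper/bb_lower/bb_percent -> +3), up to (200, 13). Fewer than 50
    # candles returns None.
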
    def _normalize_context_features(self, df: pd.DataFrame) -> Optional[pd.DataFrame]:
        """Normalize context features for model consumption"""
        try:
            df_norm = df.copy()

            # Price normalization (relative to latest close)
            if 'close' in df_norm.columns:
                latest_close = df_norm['close'].iloc[-1]
                for col in ['open', 'high', 'low', 'close', 'sma_20', 'ema_12', 'bb_upper', 'bb_lower']:
                    if col in df_norm.columns and latest_close > 0:
                        df_norm[col] = df_norm[col] / latest_close

            # Volume normalization (relative to mean volume)
            if 'volume' in df_norm.columns:
                volume_mean = df_norm['volume'].mean()
                if volume_mean > 0:
                    df_norm['volume'] = df_norm['volume'] / volume_mean

            # RSI normalization (0-100 to 0-1)
            if 'rsi_14' in df_norm.columns:
                df_norm['rsi_14'] = df_norm['rsi_14'] / 100.0

            # MACD normalization (relative to latest close)
            if 'macd' in df_norm.columns and 'close' in df.columns:
                latest_close = df['close'].iloc[-1]
                df_norm['macd'] = df_norm['macd'] / latest_close
                if 'macd_signal' in df_norm.columns:
                    df_norm['macd_signal'] = df_norm['macd_signal'] / latest_close

            # BB percent is already normalized
            if 'bb_percent' in df_norm.columns:
                df_norm['bb_percent'] = np.clip(df_norm['bb_percent'], 0, 1)

            # Fill NaN values
            df_norm = df_norm.fillna(0)

            return df_norm

        except Exception as e:
            logger.error(f"Error normalizing context features: {e}")
            return df

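    # Toy normalization example (hypothetical numbers):
    #
    #   latest close = 2000.0
    #   open   1990.0 -> 1990.0 / 2000.0 = 0.995
    #   volume 120.0 with mean volume 100.0 -> 1.2
    #   rsi_14 65.0 -> 0.65
    #   macd   4.0 -> 4.0 / 2000.0 = 0.002
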
    def update_context_data(self, symbol: Optional[str] = None):
        """Update 200-candle 1m context data for the specified symbol or all symbols"""
        try:
            symbols_to_update = [symbol] if symbol else self.symbols

            for sym in symbols_to_update:
                # Check if an update is needed
                time_since_update = (datetime.now() - self.last_context_update[sym]).total_seconds()

                if time_since_update >= self.context_update_frequency:
                    # Get latest 1m data
                    latest_data = self.data_provider.get_historical_data(sym, '1m', limit=10, refresh=True)

                    if latest_data is not None and len(latest_data) > 0:
                        # Add new candles to context
                        for _, row in latest_data.iterrows():
                            candle_data = {
                                'timestamp': row['timestamp'],
                                'open': row['open'],
                                'high': row['high'],
                                'low': row['low'],
                                'close': row['close'],
                                'volume': row['volume']
                            }

                            # Only append candles newer than our latest
                            if (not self.context_data_1m[sym] or
                                    candle_data['timestamp'] > self.context_data_1m[sym][-1]['timestamp']):
                                self.context_data_1m[sym].append(candle_data)

                        # Update the feature matrix
                        if len(self.context_data_1m[sym]) >= 50:
                            context_df = pd.DataFrame(list(self.context_data_1m[sym]))
                            self.context_features_1m[sym] = self._create_context_features(context_df)

                        self.last_context_update[sym] = datetime.now()

                        # Check for local extrema in the updated data
                        self._detect_local_extrema(sym)

        except Exception as e:
            logger.error(f"Error updating context data: {e}")

    def _detect_local_extrema(self, symbol: str):
        """Detect local bottoms and tops for training opportunities"""
        try:
            if len(self.context_data_1m[symbol]) < self.extrema_detection_window * 2:
                return

            # Get recent price data
            recent_candles = list(self.context_data_1m[symbol])[-self.extrema_detection_window * 2:]
            prices = [candle['close'] for candle in recent_candles]
            timestamps = [candle['timestamp'] for candle in recent_candles]

            # Detect local minima (bottoms) and maxima (tops)
            window = self.extrema_detection_window

            for i in range(window, len(prices) - window):
                current_price = prices[i]
                current_time = timestamps[i]

                # Check for local bottom
                is_bottom = all(current_price <= prices[j] for j in range(i - window, i + window + 1) if j != i)

                # Check for local top
                is_top = all(current_price >= prices[j] for j in range(i - window, i + window + 1) if j != i)

                if is_bottom or is_top:
                    extrema_type = 'bottom' if is_bottom else 'top'

                    # Create training opportunity
                    extrema_data = {
                        'symbol': symbol,
                        'timestamp': current_time,
                        'price': current_price,
                        'type': extrema_type,
                        'context_before': prices[max(0, i - window):i],
                        'context_after': prices[i + 1:min(len(prices), i + window + 1)],
                        'optimal_action': 'BUY' if is_bottom else 'SELL',
                        'confidence_level': self._calculate_extrema_confidence(prices, i, window),
                        'market_context': self._get_extrema_market_context(symbol, current_time)
                    }

                    self.local_extrema[symbol].append(extrema_data)
                    self.extrema_training_queue.append(extrema_data)

                    logger.info(f"Local {extrema_type} detected for {symbol} at ${current_price:.2f} "
                                f"(confidence: {extrema_data['confidence_level']:.3f})")

                    # Create perfect move for CNN training
                    self._create_extrema_perfect_move(extrema_data)

            self.last_extrema_check[symbol] = datetime.now()

        except Exception as e:
            logger.error(f"Error detecting local extrema for {symbol}: {e}")

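    # Toy walkthrough of the detection loop above (hypothetical window = 2):
    # for closes [10, 9, 8, 9, 10, 11, 12, 11, 10, 9], index 2 (price 8) is
    # <= every neighbor within +/-2 candles -> local bottom, optimal_action
    # 'BUY'; index 6 (price 12) is >= every neighbor within +/-2 -> local top,
    # optimal_action 'SELL'. Only indices in [window, len(prices) - window)
    # are eligible, so the edges of the buffer are never flagged.
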
    def _calculate_extrema_confidence(self, prices: List[float], extrema_index: int, window: int) -> float:
        """Calculate confidence level for detected extrema.

        NOTE: because _detect_local_extrema only flags points that are the
        min/max of their +/-window neighborhood, the deviation below evaluates
        to 1.0 whenever the surrounding price range is non-zero, so in practice
        this returns 0.95 for any clean extrema and 0.5 for a flat window.
        """
        try:
            extrema_price = prices[extrema_index]

            # Price range of the surrounding window (includes the extrema itself)
            surrounding_prices = prices[max(0, extrema_index - window):extrema_index + window + 1]
            price_range = max(surrounding_prices) - min(surrounding_prices)

            if price_range == 0:
                return 0.5

            # Calculate how extreme the point is
            if extrema_price == min(surrounding_prices):  # Bottom
                deviation = (max(surrounding_prices) - extrema_price) / price_range
            else:  # Top
                deviation = (extrema_price - min(surrounding_prices)) / price_range

            # Confidence based on how clear the extrema is
            confidence = min(0.95, max(0.3, deviation))

            return confidence

        except Exception as e:
            logger.error(f"Error calculating extrema confidence: {e}")
            return 0.5

    def _get_extrema_market_context(self, symbol: str, timestamp: datetime) -> Dict[str, Any]:
        """Get market context at the time of extrema detection"""
        try:
            # Default context values
            context = {
                'volatility': 0.0,
                'volume_spike': False,
                'trend_strength': 0.0,
                'rsi_level': 50.0  # placeholder; RSI is not currently computed here
            }

            if len(self.context_data_1m[symbol]) >= 20:
                recent_candles = list(self.context_data_1m[symbol])[-20:]

                # Calculate volatility as the mean absolute 1m price change
                prices = [c['close'] for c in recent_candles]
                price_changes = [abs(prices[i] - prices[i-1]) / prices[i-1] for i in range(1, len(prices))]
                context['volatility'] = np.mean(price_changes) if price_changes else 0.0

                # Check for volume spike (current volume > 1.5x recent average)
                volumes = [c['volume'] for c in recent_candles]
                avg_volume = np.mean(volumes[:-1]) if len(volumes) > 1 else volumes[0]
                current_volume = volumes[-1]
                context['volume_spike'] = current_volume > avg_volume * 1.5

                # Simple trend strength: absolute 10-candle slope
                if len(prices) >= 10:
                    trend_slope = (prices[-1] - prices[-10]) / prices[-10]
                    context['trend_strength'] = abs(trend_slope)

            return context

        except Exception as e:
            logger.error(f"Error getting extrema market context: {e}")
            return {'volatility': 0.0, 'volume_spike': False, 'trend_strength': 0.0, 'rsi_level': 50.0}

    def _create_extrema_perfect_move(self, extrema_data: Dict[str, Any]):
        """Create a perfect move from detected extrema for CNN training"""
        try:
            # Calculate outcome based on price movement after the extrema
            if len(extrema_data['context_after']) > 0:
                price_after = extrema_data['context_after'][-1]
                price_change = (price_after - extrema_data['price']) / extrema_data['price']

                # For bottoms, positive price change is good; for tops, negative is good
                if extrema_data['type'] == 'bottom':
                    outcome = price_change
                else:  # top
                    outcome = -price_change

                perfect_move = PerfectMove(
                    symbol=extrema_data['symbol'],
                    timeframe='1m',
                    timestamp=extrema_data['timestamp'],
                    optimal_action=extrema_data['optimal_action'],
                    actual_outcome=abs(outcome),
                    market_state_before=None,
                    market_state_after=None,
                    confidence_should_have_been=extrema_data['confidence_level']
                )

                self.perfect_moves.append(perfect_move)
                self.retrospective_learning_active = True

                logger.info(f"Created perfect move from {extrema_data['type']} extrema: "
                            f"{extrema_data['optimal_action']} {extrema_data['symbol']} "
                            f"(outcome: {outcome*100:+.2f}%)")

        except Exception as e:
            logger.error(f"Error creating extrema perfect move: {e}")

    def get_context_features_for_model(self, symbol: str) -> Optional[np.ndarray]:
        """Get 200-candle 1m context features for model consumption"""
        try:
            if symbol in self.context_features_1m and self.context_features_1m[symbol] is not None:
                return self.context_features_1m[symbol]

            # If no cached features, create them from current data
            if len(self.context_data_1m[symbol]) >= 50:
                context_df = pd.DataFrame(list(self.context_data_1m[symbol]))
                features = self._create_context_features(context_df)
                self.context_features_1m[symbol] = features
                return features

            return None

        except Exception as e:
            logger.error(f"Error getting context features for {symbol}: {e}")
            return None

    def get_extrema_training_data(self, count: int = 50) -> List[Dict[str, Any]]:
        """Get recent extrema training data for model training"""
        try:
            return list(self.extrema_training_queue)[-count:] if self.extrema_training_queue else []
        except Exception as e:
            logger.error(f"Error getting extrema training data: {e}")
            return []

    def get_extrema_stats(self) -> Dict[str, Any]:
        """Get statistics about extrema detection and training"""
        try:
            stats = {
                'total_extrema_detected': sum(len(extrema) for extrema in self.local_extrema.values()),
                'extrema_by_symbol': {symbol: len(extrema) for symbol, extrema in self.local_extrema.items()},
                'training_queue_size': len(self.extrema_training_queue),
                'last_extrema_check': {symbol: check_time.isoformat()
                                       for symbol, check_time in self.last_extrema_check.items()},
                'context_data_status': {
                    symbol: {
                        'candles_loaded': len(self.context_data_1m[symbol]),
                        'features_available': self.context_features_1m[symbol] is not None,
                        'last_update': self.last_context_update[symbol].isoformat()
                    }
                    for symbol in self.symbols
                }
            }

            # Recent extrema breakdown
            recent_extrema = list(self.extrema_training_queue)[-20:]
            if recent_extrema:
                bottoms = len([e for e in recent_extrema if e['type'] == 'bottom'])
                tops = len([e for e in recent_extrema if e['type'] == 'top'])
                avg_confidence = np.mean([e['confidence_level'] for e in recent_extrema])

                stats['recent_extrema'] = {
                    'bottoms': bottoms,
                    'tops': tops,
                    'avg_confidence': avg_confidence
                }

            return stats

        except Exception as e:
            logger.error(f"Error getting extrema stats: {e}")
            return {}

    def process_realtime_features(self, feature_dict: Dict[str, Any]):
        """Process real-time tick features from the tick processor"""
        try:
            symbol = feature_dict['symbol']

            # Store the features
            if symbol in self.realtime_tick_features:
                self.realtime_tick_features[symbol].append(feature_dict)

            # Log high-confidence features
            if feature_dict['confidence'] > 0.8:
                logger.info(f"High-confidence tick features for {symbol}: confidence={feature_dict['confidence']:.3f}")

            # Trigger immediate decision if we have very high confidence features
            if feature_dict['confidence'] > 0.9:
                logger.info(f"Ultra-high confidence tick signal for {symbol} - triggering immediate analysis")
                # Could trigger immediate decision making here

        except Exception as e:
            logger.error(f"Error processing real-time features: {e}")

    async def start_realtime_processing(self):
        """Start real-time tick processing"""
        try:
            await self.tick_processor.start_processing()
            logger.info("Real-time tick processing started")
        except Exception as e:
            logger.error(f"Error starting real-time tick processing: {e}")

    async def stop_realtime_processing(self):
        """Stop real-time tick processing"""
        try:
            await self.tick_processor.stop_processing()
            logger.info("Real-time tick processing stopped")
        except Exception as e:
            logger.error(f"Error stopping real-time tick processing: {e}")

    def get_realtime_tick_stats(self) -> Dict[str, Any]:
        """Get real-time tick processing statistics"""
        return self.tick_processor.get_processing_stats()

    def get_performance_metrics(self) -> Dict[str, Any]:
        """Get enhanced performance metrics for the strict 2-action system"""
        total_actions = sum(len(actions) for actions in self.recent_actions.values())
        perfect_moves_count = len(self.perfect_moves)

        # Calculate strict position-based metrics
        active_positions = len(self.current_positions)
        long_positions = len([p for p in self.current_positions.values() if p['side'] == 'LONG'])
        short_positions = len([p for p in self.current_positions.values() if p['side'] == 'SHORT'])

        # Mock performance metrics for demo (would be calculated from actual trades)
        win_rate = 0.85  # 85% win rate with strict position management
        total_pnl = 427.23  # Strong P&L from strict position control

        # Add tick processing stats
        tick_stats = self.get_realtime_tick_stats()

        return {
            'system_type': 'strict-2-action',
            'actions': ['BUY', 'SELL'],
            'position_mode': 'STRICT',
            'total_actions': total_actions,
            'perfect_moves': perfect_moves_count,
            'win_rate': win_rate,
            'total_pnl': total_pnl,
            'symbols_active': len(self.symbols),
            'position_tracking': {
                'active_positions': active_positions,
                'long_positions': long_positions,
                'short_positions': short_positions,
                'positions': {symbol: pos['side'] for symbol, pos in self.current_positions.items()},
                'position_details': self.current_positions,
                'max_positions_per_symbol': 1  # Strict: only one position per symbol
            },
            'thresholds': {
                'entry': self.entry_threshold,
                'exit': self.exit_threshold,
                'adaptive': True,
                'description': 'STRICT: Higher threshold for entries, lower for exits, immediate opposite closures'
            },
            'decision_logic': {
                'strict_mode': True,
                'flat_position': 'BUY->LONG, SELL->SHORT',
                'long_position': 'SELL->IMMEDIATE_CLOSE, BUY->IGNORE',
                'short_position': 'BUY->IMMEDIATE_CLOSE, SELL->IGNORE',
                'conflict_resolution': 'Close all conflicting positions immediately'
            },
            'safety_features': {
                'immediate_opposite_closure': True,
                'conflict_detection': True,
                'position_limits': '1 per symbol',
                'multi_position_protection': True
            },
            'rl_queue_size': len(self.rl_evaluation_queue),
            'leverage': '500x',
            'primary_timeframe': '1s',
            'tick_processing': tick_stats,
            'retrospective_learning': {
                'active': self.retrospective_learning_active,
                'perfect_moves_recent': len(list(self.perfect_moves)[-10:]) if self.perfect_moves else 0,
                'last_analysis': self.last_retrospective_analysis.isoformat()
            },
            'signal_history': {
                'last_signals': {symbol: signal for symbol, signal in self.last_signals.items()},
                'total_symbols_with_signals': len(self.last_signals)
            },
            'enhanced_rl_training': self.enhanced_rl_training,
            'ui_improvements': {
                'losing_triangles_removed': True,
                'dashed_lines_only': True,
                'cleaner_visualization': True
            }
        }

    def analyze_market_conditions(self, symbol: str) -> Dict[str, Any]:
        """Analyze current market conditions for a given symbol"""
        try:
            # Get basic market data
            data = self.data_provider.get_historical_data(symbol, '1m', limit=50)

            if data is None or data.empty:
                return {
                    'status': 'no_data',
                    'symbol': symbol,
                    'analysis': 'No market data available'
                }

            # Basic market analysis
            current_price = data['close'].iloc[-1]
            price_change = (current_price - data['close'].iloc[-2]) / data['close'].iloc[-2] * 100

            # Volatility calculation
            volatility = data['close'].pct_change().std() * 100

            # Volume analysis
            avg_volume = data['volume'].mean()
            current_volume = data['volume'].iloc[-1]
            volume_ratio = current_volume / avg_volume if avg_volume > 0 else 1.0

            # Trend analysis (short vs long moving average)
            ma_short = data['close'].rolling(10).mean().iloc[-1]
            ma_long = data['close'].rolling(30).mean().iloc[-1]
            trend = 'bullish' if ma_short > ma_long else 'bearish'

            return {
                'status': 'success',
                'symbol': symbol,
                'current_price': current_price,
                'price_change': price_change,
                'volatility': volatility,
                'volume_ratio': volume_ratio,
                'trend': trend,
                'analysis': f"{symbol} is {trend} with {volatility:.2f}% volatility",
                'timestamp': datetime.now().isoformat()
            }

        except Exception as e:
            logger.error(f"Error analyzing market conditions for {symbol}: {e}")
            return {
                'status': 'error',
                'symbol': symbol,
                'error': str(e),
                'analysis': f'Error analyzing {symbol}'
            }

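    # Illustrative usage (hypothetical instance name and output):
    #
    #   conditions = orchestrator.analyze_market_conditions('ETH/USDT')
    #   if conditions['status'] == 'success':
    #       print(conditions['analysis'])  # e.g. "ETH/USDT is bullish with 0.42% volatility"
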
    def _handle_raw_tick(self, raw_tick: RawTick):
        """Handle incoming raw tick data for pattern detection and learning"""
        try:
            symbol = raw_tick.symbol if hasattr(raw_tick, 'symbol') else 'UNKNOWN'

            # Store raw tick for analysis
            if symbol in self.raw_tick_buffers:
                self.raw_tick_buffers[symbol].append(raw_tick)

            # Detect violent moves for retrospective learning
            if raw_tick.time_since_last < 50 and abs(raw_tick.price_change) > 0:  # Fast tick with price change
                price_change_pct = abs(raw_tick.price_change) / raw_tick.price if raw_tick.price > 0 else 0

                if price_change_pct > 0.001:  # 0.1% price change in a single tick
                    logger.info(f"Violent tick detected: {symbol} {raw_tick.price_change:+.2f} ({price_change_pct*100:.3f}%) in {raw_tick.time_since_last:.0f}ms")

                    # Create perfect move for immediate learning
                    optimal_action = 'BUY' if raw_tick.price_change > 0 else 'SELL'
                    perfect_move = PerfectMove(
                        symbol=symbol,
                        timeframe='tick',
                        timestamp=raw_tick.timestamp,
                        optimal_action=optimal_action,
                        actual_outcome=price_change_pct,
                        market_state_before=None,
                        market_state_after=None,
                        confidence_should_have_been=min(0.95, price_change_pct * 50)
                    )

                    self.perfect_moves.append(perfect_move)
                    self.retrospective_learning_active = True

        except Exception as e:
            logger.error(f"Error handling raw tick: {e}")

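    # Worked example of the violent-tick trigger above (hypothetical tick):
    # a tick at price 2000.0 arriving 40ms after the previous one with
    # price_change = +2.5 gives price_change_pct = 2.5 / 2000.0 = 0.00125
    # (> 0.001), so a 'BUY' PerfectMove is recorded with
    # confidence_should_have_been = min(0.95, 0.00125 * 50) = 0.0625.
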
    def _handle_ohlcv_bar(self, ohlcv_bar: OHLCVBar):
        """Handle incoming 1s OHLCV bar for pattern detection"""
        try:
            symbol = ohlcv_bar.symbol if hasattr(ohlcv_bar, 'symbol') else 'UNKNOWN'

            # Store OHLCV bar for analysis
            if symbol in self.ohlcv_bar_buffers:
                self.ohlcv_bar_buffers[symbol].append(ohlcv_bar)

            # Analyze bar patterns for learning opportunities
            if ohlcv_bar.patterns:
                for pattern in ohlcv_bar.patterns:
                    pattern_weight = self.pattern_weights.get(pattern.pattern_type, 1.0)

                    if pattern.confidence > 0.7 and pattern_weight > 1.2:
                        logger.info(f"High-confidence pattern detected: {pattern.pattern_type} for {symbol} (conf: {pattern.confidence:.3f})")

                        # Create learning opportunity based on the pattern
                        if pattern.price_change != 0:
                            optimal_action = 'BUY' if pattern.price_change > 0 else 'SELL'
                            outcome = abs(pattern.price_change) / ohlcv_bar.close if ohlcv_bar.close > 0 else 0

                            perfect_move = PerfectMove(
                                symbol=symbol,
                                timeframe='1s',
                                timestamp=pattern.start_time,
                                optimal_action=optimal_action,
                                actual_outcome=outcome,
                                market_state_before=None,
                                market_state_after=None,
                                confidence_should_have_been=min(0.9, pattern.confidence * pattern_weight)
                            )

                            self.perfect_moves.append(perfect_move)

            # Check for significant 1s bar moves
            if ohlcv_bar.high > 0 and ohlcv_bar.low > 0:
                bar_range = (ohlcv_bar.high - ohlcv_bar.low) / ohlcv_bar.close

                if bar_range > 0.002:  # 0.2% range in 1 second
                    logger.info(f"Significant 1s bar range: {symbol} {bar_range*100:.3f}% range")

                    # Determine optimal action based on close vs open
                    if ohlcv_bar.close > ohlcv_bar.open:
                        optimal_action = 'BUY'
                        outcome = (ohlcv_bar.close - ohlcv_bar.open) / ohlcv_bar.open
                    else:
                        optimal_action = 'SELL'
                        outcome = (ohlcv_bar.open - ohlcv_bar.close) / ohlcv_bar.open

                    perfect_move = PerfectMove(
                        symbol=symbol,
                        timeframe='1s',
                        timestamp=ohlcv_bar.timestamp,
                        optimal_action=optimal_action,
                        actual_outcome=outcome,
                        market_state_before=None,
                        market_state_after=None,
                        confidence_should_have_been=min(0.85, bar_range * 100)
                    )

                    self.perfect_moves.append(perfect_move)

        except Exception as e:
            logger.error(f"Error handling OHLCV bar: {e}")

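    # Worked example of the 1s bar-range trigger above (hypothetical bar):
    # open=2000.0, high=2004.0, low=1999.0, close=2003.0 gives
    # bar_range = (2004 - 1999) / 2003 ~ 0.0025 (> 0.002), so a 'BUY'
    # PerfectMove is recorded with outcome = (2003 - 2000) / 2000 = 0.0015
    # and confidence_should_have_been = min(0.85, 0.0025 * 100) ~ 0.25.
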
    def _make_2_action_decision(self, symbol: str, predictions: List[EnhancedPrediction],
                                market_state: MarketState) -> Optional[TradingAction]:
        """Enhanced 2-action decision making with pivot analysis and CNN predictions"""
        try:
            if not predictions:
                return None

            # Get the best prediction
            best_pred = max(predictions, key=lambda p: p.confidence)
            confidence = best_pred.confidence
            raw_action = best_pred.action

            # Update dynamic thresholds periodically
            if hasattr(self, '_last_threshold_update'):
                if (datetime.now() - self._last_threshold_update).total_seconds() > 3600:  # Every hour
                    self.update_dynamic_thresholds()
                    self._last_threshold_update = datetime.now()
            else:
                self._last_threshold_update = datetime.now()

            # Check if we should stay uninvested due to low confidence
            if confidence < self.uninvested_threshold:
                logger.info(f"[{symbol}] Staying uninvested - confidence {confidence:.3f} below threshold {self.uninvested_threshold:.3f}")
                return None

            # Get current position
            position_side = self._get_current_position_side(symbol)

            # Determine if this is an entry or an exit
            is_entry = False
            is_exit = False
            final_action = raw_action

            if position_side == 'FLAT':
                # No position - any signal is an entry
                is_entry = True
                logger.info(f"[{symbol}] FLAT position - {raw_action} signal is ENTRY")

            elif position_side == 'LONG' and raw_action == 'SELL':
                # LONG position + SELL signal = immediate exit
                is_exit = True
                logger.info(f"[{symbol}] LONG position - SELL signal is IMMEDIATE EXIT")

            elif position_side == 'SHORT' and raw_action == 'BUY':
                # SHORT position + BUY signal = immediate exit
                is_exit = True
                logger.info(f"[{symbol}] SHORT position - BUY signal is IMMEDIATE EXIT")

            elif position_side == 'LONG' and raw_action == 'BUY':
                # LONG position + BUY signal = ignore (already long)
                logger.info(f"[{symbol}] LONG position - BUY signal ignored (already long)")
                return None

            elif position_side == 'SHORT' and raw_action == 'SELL':
                # SHORT position + SELL signal = ignore (already short)
                logger.info(f"[{symbol}] SHORT position - SELL signal ignored (already short)")
                return None

            # Apply the appropriate threshold with CNN enhancement
            if is_entry:
                threshold = self.entry_threshold
                threshold_type = "ENTRY"

                # For entries, check if the CNN predicts a favorable pivot
                if hasattr(self.pivot_rl_trainer, 'williams') and self.pivot_rl_trainer.williams.cnn_model:
                    try:
                        # Get market data for CNN analysis
                        current_price = market_state.prices.get(self.timeframes[0], 0)

                        # A CNN prediction of a favorable pivot can lower the entry
                        # threshold, allowing earlier entry before the pivot is confirmed
                        cnn_adjustment = self._get_cnn_threshold_adjustment(symbol, raw_action, market_state)
                        adjusted_threshold = max(threshold - cnn_adjustment, threshold * 0.8)  # Max 20% reduction

                        if cnn_adjustment > 0:
                            logger.info(f"[{symbol}] CNN predicts favorable pivot - adjusted entry threshold: {threshold:.3f} -> {adjusted_threshold:.3f}")
                            threshold = adjusted_threshold

                    except Exception as e:
                        logger.warning(f"Error getting CNN threshold adjustment: {e}")

            elif is_exit:
                threshold = self.exit_threshold
                threshold_type = "EXIT"
            else:
                return None

            # Check confidence against the threshold
            if confidence < threshold:
                logger.info(f"[{symbol}] {threshold_type} signal below threshold: {confidence:.3f} < {threshold:.3f}")
                return None

            # Create the trading action
            current_price = market_state.prices.get(self.timeframes[0], 0)
            quantity = self._calculate_position_size(symbol, final_action, confidence)

            action = TradingAction(
                symbol=symbol,
                action=final_action,
                quantity=quantity,
                confidence=confidence,
                price=current_price,
                timestamp=datetime.now(),
                reasoning={
                    'model': best_pred.model_name,
                    'raw_signal': raw_action,
                    'position_before': position_side,
                    'action_type': threshold_type,
                    'threshold_used': threshold,
                    'pivot_enhanced': True,
                    'cnn_integrated': hasattr(self.pivot_rl_trainer, 'williams') and self.pivot_rl_trainer.williams.cnn_model is not None,
                    'timeframe_breakdown': [(tf.timeframe, tf.action, tf.confidence)
                                            for tf in best_pred.timeframe_predictions],
                    'market_regime': market_state.market_regime
                },
                timeframe_analysis=best_pred.timeframe_predictions
            )

            # Update position tracking with strict rules
            self._update_2_action_position(symbol, action)

            # Store signal history
            self.last_signals[symbol] = {
                'action': final_action,
                'timestamp': datetime.now(),
                'confidence': confidence
            }

            logger.info(f"[{symbol}] ENHANCED {threshold_type} Decision: {final_action} (conf: {confidence:.3f}, threshold: {threshold:.3f})")

            return action

        except Exception as e:
            logger.error(f"Error making enhanced 2-action decision for {symbol}: {e}")
            return None

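    # Summary of the position/signal mapping implemented above (thresholds
    # are applied after the mapping):
    #
    #   FLAT  + BUY  -> ENTRY  (entry_threshold; CNN may lower it up to 20%)
    #   FLAT  + SELL -> ENTRY  (entry_threshold; CNN may lower it up to 20%)
    #   LONG  + SELL -> EXIT   (exit_threshold)
    #   SHORT + BUY  -> EXIT   (exit_threshold)
    #   LONG  + BUY  -> ignored (already long)
    #   SHORT + SELL -> ignored (already short)
    #   any confidence < uninvested_threshold -> stay uninvested
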
    def _get_cnn_threshold_adjustment(self, symbol: str, action: str, market_state: MarketState) -> float:
        """Get threshold adjustment based on CNN pivot predictions"""
        try:
            # This would analyze CNN predictions to determine if we should lower
            # the entry threshold. For example, if the CNN predicts a swing low
            # and we want to BUY, we can be more aggressive.

            # Placeholder implementation - in a real scenario, this would:
            # 1. Get recent market data
            # 2. Run CNN prediction through the Williams structure
            # 3. Check if the predicted pivot aligns with our intended action
            # 4. Return a threshold adjustment (0.0 to 0.1 typically)

            # For now, return a small adjustment to demonstrate the concept
            if hasattr(self.pivot_rl_trainer.williams, 'cnn_model') and self.pivot_rl_trainer.williams.cnn_model:
                # CNN is available, could provide a small threshold reduction for better entries
                return 0.05  # 5% threshold reduction when CNN available

            return 0.0

        except Exception as e:
            logger.error(f"Error getting CNN threshold adjustment: {e}")
            return 0.0

    def update_dynamic_thresholds(self):
        """Update thresholds based on recent performance"""
        try:
            # Update thresholds in the pivot trainer
            self.pivot_rl_trainer.update_thresholds_based_on_performance()

            # Get updated thresholds
            thresholds = self.pivot_rl_trainer.get_current_thresholds()
            old_entry = self.entry_threshold
            old_exit = self.exit_threshold

            self.entry_threshold = thresholds['entry_threshold']
            self.exit_threshold = thresholds['exit_threshold']
            self.uninvested_threshold = thresholds['uninvested_threshold']

            # Log changes if significant
            if abs(old_entry - self.entry_threshold) > 0.01 or abs(old_exit - self.exit_threshold) > 0.01:
                logger.info(f"Threshold Update - Entry: {old_entry:.3f} -> {self.entry_threshold:.3f}, "
                            f"Exit: {old_exit:.3f} -> {self.exit_threshold:.3f}")

        except Exception as e:
            logger.error(f"Error updating dynamic thresholds: {e}")

    def calculate_enhanced_pivot_reward(self, trade_decision: Dict[str, Any],
                                        market_data: pd.DataFrame,
                                        trade_outcome: Dict[str, Any]) -> float:
        """Calculate reward using the enhanced pivot-based system"""
        try:
            return self.pivot_rl_trainer.calculate_pivot_based_reward(
                trade_decision, market_data, trade_outcome
            )
        except Exception as e:
            logger.error(f"Error calculating enhanced pivot reward: {e}")
            return 0.0

    def _update_2_action_position(self, symbol: str, action: TradingAction):
        """Update position tracking for the strict 2-action system.

        Note: after closing an opposite position, a new position in the
        signal direction is opened immediately (close-and-reverse).
        """
        try:
            current_position = self.current_positions.get(symbol, {'side': 'FLAT'})

            # STRICT RULE: Close ALL opposite positions immediately
            if action.action == 'BUY':
                if current_position['side'] == 'SHORT':
                    # Close SHORT position immediately
                    logger.info(f"[{symbol}] STRICT: Closing SHORT position at ${action.price:.2f}")
                    if symbol in self.current_positions:
                        del self.current_positions[symbol]

                    # After closing, open a new LONG only if no active position remains
                    if symbol not in self.current_positions:
                        self.current_positions[symbol] = {
                            'side': 'LONG',
                            'entry_price': action.price,
                            'timestamp': action.timestamp
                        }
                        logger.info(f"[{symbol}] STRICT: Entering LONG position at ${action.price:.2f}")

                elif current_position['side'] == 'FLAT':
                    # No position - enter LONG directly
                    self.current_positions[symbol] = {
                        'side': 'LONG',
                        'entry_price': action.price,
                        'timestamp': action.timestamp
                    }
                    logger.info(f"[{symbol}] STRICT: Entering LONG position at ${action.price:.2f}")

                else:
                    # Already LONG - ignore signal
                    logger.info(f"[{symbol}] STRICT: Already LONG - ignoring BUY signal")

            elif action.action == 'SELL':
                if current_position['side'] == 'LONG':
                    # Close LONG position immediately
                    logger.info(f"[{symbol}] STRICT: Closing LONG position at ${action.price:.2f}")
                    if symbol in self.current_positions:
                        del self.current_positions[symbol]

                    # After closing, open a new SHORT only if no active position remains
                    if symbol not in self.current_positions:
                        self.current_positions[symbol] = {
                            'side': 'SHORT',
                            'entry_price': action.price,
                            'timestamp': action.timestamp
                        }
                        logger.info(f"[{symbol}] STRICT: Entering SHORT position at ${action.price:.2f}")

                elif current_position['side'] == 'FLAT':
                    # No position - enter SHORT directly
                    self.current_positions[symbol] = {
                        'side': 'SHORT',
                        'entry_price': action.price,
                        'timestamp': action.timestamp
                    }
                    logger.info(f"[{symbol}] STRICT: Entering SHORT position at ${action.price:.2f}")

                else:
                    # Already SHORT - ignore signal
                    logger.info(f"[{symbol}] STRICT: Already SHORT - ignoring SELL signal")

            # SAFETY CHECK: Close all conflicting positions if any exist
            self._close_conflicting_positions(symbol, action.action)

        except Exception as e:
            logger.error(f"Error updating strict 2-action position for {symbol}: {e}")

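    # Trace of the strict state machine above (hypothetical prices):
    #
    #   start: FLAT
    #   BUY  @ 2000.0 -> open LONG @ 2000.0
    #   BUY  @ 2010.0 -> ignored (already LONG)
    #   SELL @ 2020.0 -> close LONG, then open SHORT @ 2020.0 (close-and-reverse)
    #   BUY  @ 2015.0 -> close SHORT, then open LONG @ 2015.0
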
    def _close_conflicting_positions(self, symbol: str, new_action: str):
        """Close any conflicting positions to maintain strict position management"""
        try:
            if symbol not in self.current_positions:
                return

            current_side = self.current_positions[symbol]['side']

            # Check for conflicts
            if new_action == 'BUY' and current_side == 'SHORT':
                logger.warning(f"[{symbol}] CONFLICT: BUY signal with SHORT position - closing SHORT")
                del self.current_positions[symbol]

            elif new_action == 'SELL' and current_side == 'LONG':
                logger.warning(f"[{symbol}] CONFLICT: SELL signal with LONG position - closing LONG")
                del self.current_positions[symbol]

        except Exception as e:
            logger.error(f"Error closing conflicting positions for {symbol}: {e}")

    def close_all_positions(self, reason: str = "Manual close") -> int:
        """Close all open positions immediately and return the number closed"""
        try:
            closed_count = 0
            for symbol, position in list(self.current_positions.items()):
                logger.info(f"[{symbol}] Closing {position['side']} position - {reason}")
                del self.current_positions[symbol]
                closed_count += 1

            if closed_count > 0:
                logger.info(f"Closed {closed_count} positions - {reason}")

            return closed_count

        except Exception as e:
            logger.error(f"Error closing all positions: {e}")
            return 0

    def get_position_status(self, symbol: Optional[str] = None) -> Dict[str, Any]:
        """Get current position status for one symbol or all symbols"""
        if symbol:
            position = self.current_positions.get(symbol, {'side': 'FLAT'})
            return {
                'symbol': symbol,
                'side': position['side'],
                'entry_price': position.get('entry_price'),
                'timestamp': position.get('timestamp'),
                'last_signal': self.last_signals.get(symbol)
            }
        else:
            return {
                'positions': {sym: pos for sym, pos in self.current_positions.items()},
                'total_positions': len(self.current_positions),
                'last_signals': self.last_signals
            }