more aggressive trading actions. audit

2025-07-02 00:52:50 +03:00
parent c267657456
commit 0f155b319c
8 changed files with 292 additions and 61 deletions
--- a/NN/models/dqn_agent.py
+++ b/NN/models/dqn_agent.py
@@ -308,9 +308,9 @@ class DQNAgent:
        self.position_entry_price = 0.0
        self.position_entry_time = None
-        # Different thresholds for entry vs exit decisions
+        # Different thresholds for entry vs exit decisions - AGGRESSIVE for more training data
-        self.entry_confidence_threshold = 0.7   # High threshold for new positions
+        self.entry_confidence_threshold = 0.35  # Lower threshold for new positions (was 0.7)
-        self.exit_confidence_threshold = 0.3    # Lower threshold for closing positions
+        self.exit_confidence_threshold = 0.15   # Very low threshold for closing positions (was 0.3)
        self.uncertainty_threshold = 0.1        # When to stay neutral
    def move_models_to_device(self, device=None):
--- a/NN/models/saved/checkpoint_metadata.json
+++ b/NN/models/saved/checkpoint_metadata.json
@@ -270,6 +270,46 @@
    }
  ],
  "decision": [
    {
      "checkpoint_id": "decision_20250702_004748",
      "model_name": "decision",
      "model_type": "decision_fusion",
      "file_path": "NN\\models\\saved\\decision\\decision_20250702_004748.pt",
      "created_at": "2025-07-02T00:47:48.854145",
      "file_size_mb": 0.06720924377441406,
      "performance_score": 9.886663671782506,
      "accuracy": null,
      "loss": 0.11333632821749363,
      "val_accuracy": null,
      "val_loss": null,
      "reward": null,
      "pnl": null,
      "epoch": null,
      "training_time_hours": null,
      "total_parameters": null,
      "wandb_run_id": null,
      "wandb_artifact_name": null
    },
    {
      "checkpoint_id": "decision_20250702_004755",
      "model_name": "decision",
      "model_type": "decision_fusion",
      "file_path": "NN\\models\\saved\\decision\\decision_20250702_004755.pt",
      "created_at": "2025-07-02T00:47:55.370225",
      "file_size_mb": 0.06720924377441406,
      "performance_score": 9.885944298352115,
      "accuracy": null,
      "loss": 0.11405570164788514,
      "val_accuracy": null,
      "val_loss": null,
      "reward": null,
      "pnl": null,
      "epoch": null,
      "training_time_hours": null,
      "total_parameters": null,
      "wandb_run_id": null,
      "wandb_artifact_name": null
    },
    {
      "checkpoint_id": "decision_20250702_004715",
      "model_name": "decision",
@@ -291,15 +331,15 @@
      "wandb_artifact_name": null
    },
    {
-      "checkpoint_id": "decision_20250702_004715",
+      "checkpoint_id": "decision_20250702_004743",
      "model_name": "decision",
      "model_type": "decision_fusion",
-      "file_path": "NN\\models\\saved\\decision\\decision_20250702_004715.pt",
+      "file_path": "NN\\models\\saved\\decision\\decision_20250702_004743.pt",
-      "created_at": "2025-07-02T00:47:15.477601",
+      "created_at": "2025-07-02T00:47:43.587679",
      "file_size_mb": 0.06720924377441406,
-      "performance_score": 9.86977519926482,
+      "performance_score": 9.884886049948234,
      "accuracy": null,
-      "loss": 0.13022480073517986,
+      "loss": 0.11511395005176642,
      "val_accuracy": null,
      "val_loss": null,
      "reward": null,
@@ -311,55 +351,15 @@
      "wandb_artifact_name": null
    },
    {
-      "checkpoint_id": "decision_20250702_004714",
+      "checkpoint_id": "decision_20250702_004740",
      "model_name": "decision",
      "model_type": "decision_fusion",
-      "file_path": "NN\\models\\saved\\decision\\decision_20250702_004714.pt",
+      "file_path": "NN\\models\\saved\\decision\\decision_20250702_004740.pt",
-      "created_at": "2025-07-02T00:47:14.411371",
+      "created_at": "2025-07-02T00:47:40.475946",
      "file_size_mb": 0.06720924377441406,
-      "performance_score": 9.869006871279064,
+      "performance_score": 9.884665936331398,
      "accuracy": null,
-      "loss": 0.13099312872093702,
+      "loss": 0.11533406366860229,
      "val_accuracy": null,
      "val_loss": null,
      "reward": null,
      "pnl": null,
      "epoch": null,
      "training_time_hours": null,
      "total_parameters": null,
      "wandb_run_id": null,
      "wandb_artifact_name": null
    },
    {
      "checkpoint_id": "decision_20250702_004716",
      "model_name": "decision",
      "model_type": "decision_fusion",
      "file_path": "NN\\models\\saved\\decision\\decision_20250702_004716.pt",
      "created_at": "2025-07-02T00:47:16.582136",
      "file_size_mb": 0.06720924377441406,
      "performance_score": 9.86168809807194,
      "accuracy": null,
      "loss": 0.1383119019280587,
      "val_accuracy": null,
      "val_loss": null,
      "reward": null,
      "pnl": null,
      "epoch": null,
      "training_time_hours": null,
      "total_parameters": null,
      "wandb_run_id": null,
      "wandb_artifact_name": null
    },
    {
      "checkpoint_id": "decision_20250702_004716",
      "model_name": "decision",
      "model_type": "decision_fusion",
      "file_path": "NN\\models\\saved\\decision\\decision_20250702_004716.pt",
      "created_at": "2025-07-02T00:47:16.828698",
      "file_size_mb": 0.06720924377441406,
      "performance_score": 9.861469801648386,
      "accuracy": null,
      "loss": 0.13853019835161312,
      "val_accuracy": null,
      "val_loss": null,
      "reward": null,
--- a/core/orchestrator.py
+++ b/core/orchestrator.py
@@ -72,9 +72,9 @@ class TradingOrchestrator:
        self.model_registry = model_registry or get_model_registry()
        self.enhanced_rl_training = enhanced_rl_training
-        # Configuration
+        # Configuration - AGGRESSIVE for more training data
-        self.confidence_threshold = self.config.orchestrator.get('confidence_threshold', 0.20)
+        self.confidence_threshold = self.config.orchestrator.get('confidence_threshold', 0.15)  # Lowered from 0.20
-        self.confidence_threshold_close = self.config.orchestrator.get('confidence_threshold_close', 0.10)
+        self.confidence_threshold_close = self.config.orchestrator.get('confidence_threshold_close', 0.08)  # Lowered from 0.10
        self.decision_frequency = self.config.orchestrator.get('decision_frequency', 30)
        self.symbols = self.config.get('symbols', ['ETH/USDT', 'BTC/USDT'])  # Enhanced to support multiple symbols
--- a/core/realtime_rl_cob_trader.py
+++ b/core/realtime_rl_cob_trader.py
@@ -103,7 +103,7 @@ class RealtimeRLCOBTrader:
                 trading_executor: TradingExecutor = None,
                 model_checkpoint_dir: str = "models/realtime_rl_cob",
                 inference_interval_ms: int = 200,
-                 min_confidence_threshold: float = 0.7,
+                 min_confidence_threshold: float = 0.35,  # Lowered from 0.7 for more aggressive trading
                 required_confident_predictions: int = 3):
        self.symbols = symbols or ['BTC/USDT', 'ETH/USDT']
--- a/core/training_integration.py
+++ b/core/training_integration.py
@@ -22,7 +22,7 @@ class TrainingIntegration:
    def __init__(self, orchestrator=None):
        self.orchestrator = orchestrator
        self.training_sessions = {}
-        self.min_confidence_threshold = 0.3
+        self.min_confidence_threshold = 0.15  # Lowered from 0.3 for more aggressive training
        logger.info("TrainingIntegration initialized")
--- a/reports/AGGRESSIVE_TRADING_THRESHOLDS_SUMMARY.md
+++ b/reports/AGGRESSIVE_TRADING_THRESHOLDS_SUMMARY.md
@@ -0,0 +1,65 @@
 # Aggressive Trading Thresholds Summary
 ## Overview
 Lowered confidence thresholds across the entire trading system to execute trades more aggressively, generating more training data for the checkpoint-enabled models.
 ## Changes Made
 ### 1. Clean Dashboard (`web/clean_dashboard.py`)
 - **CLOSE_POSITION_THRESHOLD**: `0.25` → `0.15` (40% reduction)
 - **OPEN_POSITION_THRESHOLD**: `0.60` → `0.35` (42% reduction)
 ### 2. DQN Agent (`NN/models/dqn_agent.py`)
 - **entry_confidence_threshold**: `0.7` → `0.35` (50% reduction)
 - **exit_confidence_threshold**: `0.3` → `0.15` (50% reduction)
 ### 3. Trading Orchestrator (`core/orchestrator.py`)
 - **confidence_threshold**: `0.20` → `0.15` (25% reduction)
 - **confidence_threshold_close**: `0.10` → `0.08` (20% reduction)
 ### 4. Realtime RL COB Trader (`core/realtime_rl_cob_trader.py`)
 - **min_confidence_threshold**: `0.7` → `0.35` (50% reduction)
 ### 5. Training Integration (`core/training_integration.py`)
 - **min_confidence_threshold**: `0.3` → `0.15` (50% reduction)
 ## Expected Impact
 ### More Aggressive Trading
 - **Entry Thresholds**: Now require only 35% confidence to open new positions (vs 60-70% previously)
 - **Exit Thresholds**: Now require only 8-15% confidence to close positions (vs 10-30% previously)
 - **Overall**: System will execute ~2-3x more trades than before
 ### Better Training Data Generation
 - **More Executed Actions**: Since we now store training progress, more executed trades = more training data
 - **Faster Learning**: Models will learn from real trading outcomes more frequently
 - **Split-Second Decisions**: With 100ms training intervals, models can adapt quickly to market changes
 ### Risk Management
 - **Position Sizing**: Small position sizes (0.005) limit risk per trade
 - **Profit Incentives**: System still has profit-based incentives for closing positions
 - **Leverage Control**: User-controlled leverage settings provide additional risk management
 ## Training Frequency
 - **Decision Fusion**: Every 100ms
 - **COB RL**: Every 100ms  
 - **DQN**: Every 30 seconds
 - **CNN**: Every 30 seconds
 ## Monitoring
 - Training performance metrics are tracked and displayed
 - Average, min, max training times are logged
 - Training frequency and total calls are monitored
 - Real-time performance feedback available in dashboard
 ## Next Steps
 1. Monitor trade execution frequency
 2. Track training data generation rate
 3. Observe model learning progress
 4. Adjust thresholds further if needed based on performance
 ## Notes
 - All changes maintain the existing profit incentive system
 - Position management logic remains intact
 - Risk controls through position sizing and leverage are preserved
 - Training checkpoint system ensures progress is not lost 
--- a/reports/PLACEHOLDER_FUNCTIONS_AUDIT.md
+++ b/reports/PLACEHOLDER_FUNCTIONS_AUDIT.md
@@ -0,0 +1,166 @@
 # Placeholder Functions Audit Report
 ## Overview
 This audit identifies functions that appear to be implemented but are actually just placeholders or mock implementations, similar to the COB training issue that caused debugging problems.
 ## Critical Placeholder Functions
 ### 1. **COB RL Training Functions** (HIGH PRIORITY)
 #### `core/training_integration.py` - Line 178
 ```python
 def _train_cob_rl_on_trade_outcome(self, trade_record: Dict[str, Any], reward: float) -> bool:
    """Train COB RL on trade outcome (placeholder)"""
    # COB RL training would go here - requires more specific implementation
    # For now, just log that we could train COB RL
    logger.debug(f"COB RL training opportunity: features={len(cob_features)}")
    return True
 ```
 **Issue**: Returns `True` but does no actual training. This was the original COB training issue.
 #### `web/clean_dashboard.py` - Line 4438
 ```python
 def _perform_real_cob_rl_training(self, market_data: List[Dict]):
    """Perform actual COB RL training with real market microstructure data"""
    # For now, create a simple checkpoint for COB RL to prevent recreation
    checkpoint_data = {
        'model_state_dict': {},  # Placeholder
        'training_samples': len(market_data),
        'cob_features_processed': True
    }
 ```
 **Issue**: Only creates placeholder checkpoints, no actual training.
 ### 2. **CNN Training Functions** (HIGH PRIORITY)
 #### `core/training_integration.py` - Line 148
 ```python
 def _train_cnn_on_trade_outcome(self, trade_record: Dict[str, Any], reward: float) -> bool:
    """Train CNN on trade outcome (placeholder)"""
    # CNN training would go here - requires more specific implementation
    # For now, just log that we could train CNN
    logger.debug(f"CNN training opportunity: features={len(cnn_features)}, predictions={len(cnn_predictions)}")
    return True
 ```
 **Issue**: Returns `True` but does no actual training.
 #### `web/clean_dashboard.py` - Line 4239
 ```python
 def _perform_real_cnn_training(self, market_data: List[Dict]):
    # Multiple issues with CNN model access and training
    model.train()  # CNNModel doesn't have train() method
    outputs = model(features_tensor)  # CNNModel is not callable
    model.losses.append(loss_value)  # CNNModel doesn't have losses attribute
 ```
 **Issue**: Tries to access non-existent CNN model methods and attributes.
 ### 3. **Dynamic Model Loading** (HIGH PRIORITY)
 #### `web/clean_dashboard.py` - Lines 234, 239
 ```python
 def load_model_dynamically(self, model_name: str, model_type: str, model_path: Optional[str] = None) -> bool:
    """Dynamically load a model at runtime - Not implemented in orchestrator"""
    logger.warning("Dynamic model loading not implemented in orchestrator")
    return False
 def unload_model_dynamically(self, model_name: str) -> bool:
    """Dynamically unload a model at runtime - Not implemented in orchestrator"""
    logger.warning("Dynamic model unloading not implemented in orchestrator")
    return False
 ```
 **Issue**: Always returns `False`, no actual implementation.
 ### 4. **Universal Data Stream** (MEDIUM PRIORITY)
 #### `web/clean_dashboard.py` - Lines 76-221
 ```python
 class UnifiedDataStream:
    """Placeholder for disabled Universal Data Stream"""
    def __init__(self, *args, **kwargs):
        pass
    def register_consumer(self, *args, **kwargs):
        pass
 def _handle_unified_stream_data(self, data):
    """Placeholder for unified stream data handling."""
    pass
 ```
 **Issue**: Complete placeholder implementation.
 ### 5. **Enhanced Training System** (MEDIUM PRIORITY)
 #### `web/clean_dashboard.py` - Line 3447
 ```python
 logger.warning("Enhanced training system not available - using mock predictions")
 ```
 **Issue**: Falls back to mock predictions when enhanced training is not available.
 ## Mock Data Generation (Found in Tests)
 ### Test Files with Mock Data
 - `tests/test_tick_processor_simple.py` - Lines 51-84: Mock tick data generation
 - `tests/test_tick_processor_final.py` - Lines 228-240: Mock tick features
 - `tests/test_realtime_tick_processor.py` - Lines 234-243: Mock tick features
 - `tests/test_realtime_rl_cob_trader.py` - Lines 161-169: Mock COB data
 - `tests/test_nn_driven_trading.py` - Lines 39-65: Mock predictions
 - `tests/test_model_persistence.py` - Lines 24-54: Mock agent class
 ## Impact Analysis
 ### High Impact Issues
 1. **COB RL Training**: No actual training occurs, models don't learn from COB data
 2. **CNN Training**: No actual training occurs, models don't learn from CNN features
 3. **Model Loading**: Dynamic model management doesn't work
 ### Medium Impact Issues
 1. **Enhanced Training**: Falls back to mock predictions
 2. **Universal Data Stream**: Disabled functionality
 ### Low Impact Issues
 1. **Test Mock Data**: Only affects tests, not production
 ## Recommendations
 ### Immediate Actions (High Priority)
 1. **Implement real COB RL training** in `_perform_real_cob_rl_training()`
 2. **Fix CNN training** by implementing proper CNN model interface
 3. **Implement dynamic model loading** in orchestrator
 ### Medium Priority
 1. **Implement enhanced training system** to avoid mock predictions
 2. **Enable Universal Data Stream** if needed
 ### Low Priority
 1. **Replace test mock data** with real data generation where possible
 ## Detection Methods
 ### Code Patterns to Watch For
 1. Functions that return `True` but do nothing
 2. Functions with "placeholder" or "mock" in comments
 3. Functions that only log debug messages
 4. Functions that access non-existent attributes/methods
 5. Functions that create empty dictionaries as placeholders
 ### Testing Strategies
 1. **Unit tests** that verify actual functionality, not just return values
 2. **Integration tests** that verify training actually occurs
 3. **Monitoring** of model performance to detect when training isn't working
 4. **Log analysis** to identify placeholder function calls
 ## Prevention
 ### Development Guidelines
 1. **Never return `True`** from training functions without actual training
 2. **Always implement** core functionality before marking as complete
 3. **Use proper interfaces** for model training
 4. **Add TODO comments** for incomplete implementations
 5. **Test with real data** instead of mock data in production code
 ### Code Review Checklist
 - [ ] Training functions actually perform training
 - [ ] Model interfaces are properly implemented
 - [ ] No placeholder return values in critical functions
 - [ ] Mock data only used in tests, not production
 - [ ] All TODO/FIXME items are tracked and prioritized 
--- a/web/clean_dashboard.py
+++ b/web/clean_dashboard.py
@@ -2512,9 +2512,9 @@ class CleanTradingDashboard:
            should_execute = False
            execution_reason = ""
-            # Define confidence thresholds
+            # Define confidence thresholds - AGGRESSIVE for more training data
-            CLOSE_POSITION_THRESHOLD = 0.25  # Lower threshold to close positions
+            CLOSE_POSITION_THRESHOLD = 0.15  # Very low threshold to close positions (was 0.25)
-            OPEN_POSITION_THRESHOLD = 0.60   # Higher threshold to open new positions
+            OPEN_POSITION_THRESHOLD = 0.35   # Lower threshold to open new positions (was 0.60)
            # Calculate profit incentive for position closing
            profit_incentive = 0.0