checkpoint manager and handling

2025-06-24 21:59:23 +03:00
parent 706eb13912
commit ab8c94d735
8 changed files with 1170 additions and 29 deletions
--- a/NN/models/cnn_model.py
+++ b/NN/models/cnn_model.py
@@ -19,6 +19,10 @@ from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_sc
 import torch.nn.functional as F
 from typing import Dict, Any, Optional, Tuple

+# Import checkpoint management
+from utils.checkpoint_manager import save_checkpoint, load_best_checkpoint
+from utils.training_integration import get_training_integration
+
 # Configure logging
 logger = logging.getLogger(__name__)

@@ -507,38 +511,140 @@ class EnhancedCNNModel(nn.Module):
        return self.to(torch.device(device))

 class CNNModelTrainer:
-    """Enhanced trainer for the beefed-up CNN model"""
+    """Enhanced CNN trainer with checkpoint management integration"""
    
-    def __init__(self, model: EnhancedCNNModel, learning_rate: float = 0.0001, device: str = 'cuda'):
-        self.model = model.to(device)
-        self.device = device
-        self.learning_rate = learning_rate
+    def __init__(self, model: EnhancedCNNModel, learning_rate: float = 0.0001, device: str = 'cuda',
+                 model_name: str = "enhanced_cnn", enable_checkpoints: bool = True):
+        """Set up the model, optimizer, scheduler, losses and checkpoint state.
+
+        Args:
+            model: Network to train; it is moved to the resolved device.
+            learning_rate: Base AdamW learning rate. The OneCycleLR peak is
+                ten times this value.
+            device: Requested device string. A CUDA request falls back to CPU
+                when CUDA is unavailable; any other device is used as given.
+            model_name: Name handed to the checkpoint helpers when loading
+                and saving checkpoints.
+            enable_checkpoints: When True, obtain the training integration and
+                try to restore the best saved checkpoint at the end of
+                construction.
+        """
+        self.model = model
+        # Downgrade only an unavailable CUDA request; an explicit non-CUDA
+        # device must not be silently replaced by CPU.
+        resolved_device = torch.device(device)
+        if resolved_device.type == 'cuda' and not torch.cuda.is_available():
+            resolved_device = torch.device('cpu')
+        self.device = resolved_device
+        self.model.to(self.device)
+        # Kept as an attribute because the previous version of this class exposed it.
+        self.learning_rate = learning_rate
        
-        # Use AdamW optimizer with weight decay
-        self.optimizer = torch.optim.AdamW(
-            model.parameters(), 
-            lr=learning_rate, 
+        # Checkpoint management
+        self.model_name = model_name
+        self.enable_checkpoints = enable_checkpoints
+        self.training_integration = get_training_integration() if enable_checkpoints else None
+        self.epoch_count = 0
+        self.best_val_accuracy = 0.0
+        self.best_val_loss = float('inf')
+        self.checkpoint_frequency = 10  # Save checkpoint every 10 epochs
+        
+        # Optimizers and criteria
+        # Fully qualified torch.optim so this does not rely on a separate `optim` alias import.
+        self.optimizer = torch.optim.AdamW(
+            self.model.parameters(),
+            lr=learning_rate,
            weight_decay=0.01,
            betas=(0.9, 0.999)
        )
        
-        # Learning rate scheduler
-        self.scheduler = torch.optim.lr_scheduler.OneCycleLR(
+        # One-cycle schedule with a fixed step budget.
+        # NOTE(review): OneCycleLR raises once stepped past total_steps - confirm the
+        # training loop stays within 1000 scheduler steps or rebuilds the scheduler.
+        self.scheduler = torch.optim.lr_scheduler.OneCycleLR(
            self.optimizer,
            max_lr=learning_rate * 10,
-            total_steps=10000,  # Will be updated based on actual training
+            total_steps=1000,
            pct_start=0.1,
            anneal_strategy='cos'
        )
        
-        # Multi-task loss functions
+        # Loss functions
        self.main_criterion = nn.CrossEntropyLoss(label_smoothing=0.1)
-        self.confidence_criterion = nn.BCELoss()
+        self.confidence_criterion = nn.MSELoss()
        self.regime_criterion = nn.CrossEntropyLoss()
        self.volatility_criterion = nn.MSELoss()
        
-        self.training_history = []
+        # Training history (a dict of per-metric lists; it was a plain list before)
+        self.training_history = {
+            'train_loss': [],
+            'val_loss': [],
+            'train_accuracy': [],
+            'val_accuracy': [],
+            'learning_rates': []
+        }
        
+        # Load best checkpoint if available
+        if self.enable_checkpoints:
+            self.load_best_checkpoint()
+        
+        logger.info(f"CNN Trainer initialized with checkpoint management: {enable_checkpoints}")
+        if enable_checkpoints:
+            logger.info(f"Model name: {model_name}, Checkpoint frequency: {self.checkpoint_frequency}")
+    
+    def load_best_checkpoint(self):
+        """Restore model, optimizer, scheduler and progress state from the best checkpoint.
+
+        Does nothing when checkpointing is disabled or when no checkpoint is
+        found for `self.model_name`. Any exception is logged as a warning and
+        otherwise ignored.
+        """
+        try:
+            if not self.enable_checkpoints:
+                return
+
+            found = load_best_checkpoint(self.model_name)
+            if not found:
+                return
+
+            checkpoint_path, metadata = found
+            state = torch.load(checkpoint_path, map_location=self.device)
+
+            # Restore each component only when its entry exists in the checkpoint
+            for state_key, attr_name in (
+                ('model_state_dict', 'model'),
+                ('optimizer_state_dict', 'optimizer'),
+                ('scheduler_state_dict', 'scheduler'),
+            ):
+                if state_key in state:
+                    getattr(self, attr_name).load_state_dict(state[state_key])
+
+            # Progress fields are stored under the same name as the attribute
+            for field_name in ('epoch_count', 'best_val_accuracy',
+                               'best_val_loss', 'training_history'):
+                if field_name in state:
+                    setattr(self, field_name, state[field_name])
+
+            logger.info(f"Loaded CNN checkpoint: {metadata.checkpoint_id}")
+            logger.info(f"Epoch: {self.epoch_count}, Best val accuracy: {self.best_val_accuracy:.4f}")
+
+        except Exception as e:
+            logger.warning(f"Failed to load checkpoint for {self.model_name}: {e}")
+    
+    def save_checkpoint(self, train_accuracy: float, val_accuracy: float, 
+                       train_loss: float, val_loss: float, force_save: bool = False):
+        """Count one epoch, refresh the best validation metrics and save when due.
+
+        A save is attempted when `force_save` is set, when validation accuracy
+        or validation loss beats its stored best, or on every
+        `checkpoint_frequency`-th call.
+
+        Returns:
+            Whatever `training_integration.save_cnn_checkpoint` returns when a
+            save is attempted; otherwise False (checkpointing disabled, nothing
+            due, no training integration, or an error that was logged).
+        """
+        try:
+            if not self.enable_checkpoints:
+                return False
+
+            self.epoch_count += 1
+
+            # Record which best-so-far metrics this epoch beat
+            accuracy_improved = bool(val_accuracy > self.best_val_accuracy)
+            if accuracy_improved:
+                self.best_val_accuracy = val_accuracy
+            loss_improved = bool(val_loss < self.best_val_loss)
+            if loss_improved:
+                self.best_val_loss = val_loss
+
+            # Nothing to write unless forced, improved, or on the periodic interval
+            if not (force_save or accuracy_improved or loss_improved
+                    or self.epoch_count % self.checkpoint_frequency == 0):
+                return False
+            if not self.training_integration:
+                return False
+
+            return self.training_integration.save_cnn_checkpoint(
+                cnn_model=self.model,
+                model_name=self.model_name,
+                epoch=self.epoch_count,
+                train_accuracy=train_accuracy,
+                val_accuracy=val_accuracy,
+                train_loss=train_loss,
+                val_loss=val_loss,
+                training_time_hours=0.0  # Can be calculated by calling code
+            )
+
+        except Exception as e:
+            logger.error(f"Error saving CNN checkpoint: {e}")
+            return False
+    
    def reset_computational_graph(self):
        """Reset the computational graph to prevent in-place operation issues"""
        try:
@@ -648,6 +754,13 @@ class CNNModelTrainer:
                accuracy = (predictions == y_train).float().mean().item()
                losses['accuracy'] = accuracy
            
+            # Update training history
+            if 'train_loss' in self.training_history:
+                self.training_history['train_loss'].append(losses['total_loss'])
+                self.training_history['train_accuracy'].append(accuracy)
+                current_lr = self.optimizer.param_groups[0]['lr']
+                self.training_history['learning_rates'].append(current_lr)
+            
            return losses
            
        except Exception as e:
--- a/NN/models/dqn_agent.py
+++ b/NN/models/dqn_agent.py
@@ -14,6 +14,10 @@ import time
 # Add parent directory to path
 sys.path.append(os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))))

+# Import checkpoint management
+from utils.checkpoint_manager import save_checkpoint, load_best_checkpoint
+from utils.training_integration import get_training_integration
+
 # Configure logger
 logger = logging.getLogger(__name__)

@@ -33,7 +37,18 @@ class DQNAgent:
                 batch_size: int = 32,
                 target_update: int = 100,
                 priority_memory: bool = True,
-                 device=None):
+                 device=None,
+                 model_name: str = "dqn_agent",
+                 enable_checkpoints: bool = True):
+        
+        # Checkpoint management
+        self.model_name = model_name
+        self.enable_checkpoints = enable_checkpoints
+        self.training_integration = get_training_integration() if enable_checkpoints else None
+        self.episode_count = 0
+        self.best_reward = float('-inf')
+        self.reward_history = deque(maxlen=100)
+        self.checkpoint_frequency = 100  # Save checkpoint every 100 episodes
        
        # Extract state dimensions
        if isinstance(state_shape, tuple) and len(state_shape) > 1:
@@ -90,7 +105,91 @@ class DQNAgent:
            'confidence': 0.0,
            'raw': None
        }
-        self.extrema_memory = []  # Special memory for storing extrema points
+        self.extrema_memory = []
+        
+        # DQN hyperparameters
+        self.gamma = 0.99  # Discount factor
+        
+        # Load best checkpoint if available
+        if self.enable_checkpoints:
+            self.load_best_checkpoint()
+        
+        logger.info(f"DQN Agent initialized with checkpoint management: {enable_checkpoints}")
+        if enable_checkpoints:
+            logger.info(f"Model name: {model_name}, Checkpoint frequency: {self.checkpoint_frequency}")
+    
+    def load_best_checkpoint(self):
+        """Restore networks, optimizer and progress state from the best checkpoint.
+
+        Does nothing when checkpointing is disabled or when no checkpoint is
+        found for `self.model_name`. Any exception is logged as a warning and
+        otherwise ignored.
+        """
+        try:
+            if not self.enable_checkpoints:
+                return
+
+            found = load_best_checkpoint(self.model_name)
+            if not found:
+                return
+
+            checkpoint_path, metadata = found
+            state = torch.load(checkpoint_path, map_location=self.device)
+
+            # Restore each network/optimizer only when its entry exists in the checkpoint
+            for state_key, attr_name in (
+                ('policy_net_state_dict', 'policy_net'),
+                ('target_net_state_dict', 'target_net'),
+                ('optimizer_state_dict', 'optimizer'),
+            ):
+                if state_key in state:
+                    getattr(self, attr_name).load_state_dict(state[state_key])
+
+            # Progress fields are stored under the same name as the attribute
+            for field_name in ('episode_count', 'epsilon', 'best_reward'):
+                if field_name in state:
+                    setattr(self, field_name, state[field_name])
+
+            logger.info(f"Loaded DQN checkpoint: {metadata.checkpoint_id}")
+            logger.info(f"Episode: {self.episode_count}, Best reward: {self.best_reward:.4f}")
+
+        except Exception as e:
+            logger.warning(f"Failed to load checkpoint for {self.model_name}: {e}")
+    
+    def save_checkpoint(self, episode_reward: float, force_save: bool = False):
+        """Record an episode result and save a checkpoint when warranted.
+
+        With checkpointing enabled, every call increments the episode counter
+        and appends the reward to the rolling reward history. A save is
+        attempted when `force_save` is set, on every `checkpoint_frequency`-th
+        episode, or when the reward is a new best or within 5% of the best.
+
+        Args:
+            episode_reward: Reward of the episode that just finished.
+            force_save: Save regardless of reward or episode count.
+
+        Returns:
+            Whatever `training_integration.save_rl_checkpoint` returns when a
+            save is attempted; otherwise False (checkpointing disabled, nothing
+            due, no training integration, or an error that was logged).
+        """
+        try:
+            if not self.enable_checkpoints:
+                return False
+
+            self.episode_count += 1
+            self.reward_history.append(episode_reward)
+
+            # Calculate average reward over recent episodes
+            avg_reward = sum(self.reward_history) / len(self.reward_history)
+
+            # Decide "new best" against the previous best, before overwriting it
+            is_new_best = episode_reward > self.best_reward
+            if is_new_best:
+                self.best_reward = episode_reward
+
+            # Measure the 5% tolerance on the magnitude of the best reward so the
+            # threshold sits below the best for negative rewards as well
+            # (best * 0.95 is above a negative best, which hid new negative bests).
+            near_best_threshold = self.best_reward - 0.05 * abs(self.best_reward)
+
+            # Save when forced, on the periodic interval, or at/near the best reward
+            should_save = (
+                force_save or
+                self.episode_count % self.checkpoint_frequency == 0 or
+                is_new_best or
+                episode_reward > near_best_threshold
+            )
+
+            if should_save and self.training_integration:
+                return self.training_integration.save_rl_checkpoint(
+                    rl_agent=self,
+                    model_name=self.model_name,
+                    episode=self.episode_count,
+                    avg_reward=avg_reward,
+                    best_reward=self.best_reward,
+                    epsilon=self.epsilon,
+                    total_pnl=0.0  # Default to 0, can be set by calling code
+                )
+
+            return False
+
+        except Exception as e:
+            logger.error(f"Error saving DQN checkpoint: {e}")
+            return False
+        # NOTE(review): every path above returns, so statements that follow at this
+        # indentation are unreachable. In this diff the lines after this method look
+        # like the former tail of __init__ - confirm they still run in the constructor.
        
        # Price prediction tracking
        self.last_price_pred = {
@@ -117,7 +216,6 @@ class DQNAgent:
        # Performance tracking
        self.losses = []
        self.avg_reward = 0.0
-        self.best_reward = -float('inf')
        self.no_improvement_count = 0
        
        # Confidence tracking