merge training system

This commit is contained in:
Dobromir Popov
2025-08-23 16:27:05 +03:00
parent 81749ee18e
commit f86457fc38
8 changed files with 166 additions and 8 deletions

View File

@@ -162,8 +162,8 @@ training:
# RL-specific training settings.
# Each key appears exactly once: duplicate mapping keys are invalid YAML and
# most parsers silently keep only the last occurrence.
rl_training_interval: 300  # Train RL every 300 s = 5 minutes (was 1 hour)
min_experiences: 16  # Lowered from 50 to trigger replay sooner in cold-start
training_steps_per_cycle: 32  # Raised from 20 to use the GPU effectively
model_type: "optimized_short_term"
use_realtime: true