dash and training wip

This commit is contained in:
Dobromir Popov
2025-09-02 15:30:05 +03:00
parent 443e8e746f
commit 1b54438082
14 changed files with 270 additions and 197 deletions

View File

@@ -731,7 +731,8 @@ class RealtimeRLCOBTrader:
with self.training_lock:
# Check if we have enough data for training
predictions = list(self.prediction_history[symbol])
if len(predictions) < 10:
# Train with fewer samples to kickstart learning
if len(predictions) < 6:
return
# Calculate rewards for recent predictions
@@ -739,11 +740,11 @@ class RealtimeRLCOBTrader:
# Filter predictions with calculated rewards
training_predictions = [p for p in predictions if p.reward is not None]
if len(training_predictions) < 5:
if len(training_predictions) < 3:
return
# Prepare training batch
batch_size = min(32, len(training_predictions))
batch_size = min(16, len(training_predictions))
batch_predictions = training_predictions[-batch_size:]
# Train model