caching system fixes

This commit is contained in:
Dobromir Popov
2025-11-06 16:26:38 +02:00
parent 76e3bb6a61
commit 86ae8b499b
2 changed files with 76 additions and 2 deletions

View File

@@ -2590,8 +2590,15 @@ class DataProvider:
def _should_refresh_pivot_bounds(self, symbol: str) -> bool: def _should_refresh_pivot_bounds(self, symbol: str) -> bool:
"""Check if pivot bounds need refreshing""" """Check if pivot bounds need refreshing"""
try: try:
# Try to load from cache if not in memory
if symbol not in self.pivot_bounds: if symbol not in self.pivot_bounds:
return True cached_bounds = self._load_pivot_bounds_from_duckdb(symbol)
if cached_bounds:
self.pivot_bounds[symbol] = cached_bounds
logger.info(f"Loaded pivot bounds from cache for {symbol}")
return False # Cache is fresh, no need to refresh
else:
return True # No cache, need to refresh
bounds = self.pivot_bounds[symbol] bounds = self.pivot_bounds[symbol]
age = datetime.now() - bounds.created_timestamp age = datetime.now() - bounds.created_timestamp

View File

@@ -18,6 +18,7 @@ from datetime import datetime
from pathlib import Path from pathlib import Path
from typing import Dict, List, Optional, Tuple, Any from typing import Dict, List, Optional, Tuple, Any
import json import json
import threading
logger = logging.getLogger(__name__) logger = logging.getLogger(__name__)
@@ -37,6 +38,14 @@ class DuckDBStorage:
# Connect to DuckDB # Connect to DuckDB
self.conn = duckdb.connect(str(self.db_path)) self.conn = duckdb.connect(str(self.db_path))
# Batch logging for compact output
self._batch_buffer = [] # List of (symbol, timeframe, count, total) tuples
self._batch_lock = threading.Lock()
self._batch_flush_timer = None
self._batch_flush_delay = 0.5 # Flush after 0.5 seconds of inactivity
self._batch_timer_lock = threading.Lock()
self._flush_in_progress = False
# Initialize schema # Initialize schema
self._init_schema() self._init_schema()
@@ -113,6 +122,52 @@ class DuckDBStorage:
logger.info("DuckDB schema initialized (all data in tables)") logger.info("DuckDB schema initialized (all data in tables)")
def _schedule_batch_flush(self):
"""Schedule a batch flush after delay, resetting timer on each call"""
with self._batch_timer_lock:
# Cancel existing timer if any
if self._batch_flush_timer:
self._batch_flush_timer.cancel()
# Start new timer that will flush after delay
self._batch_flush_timer = threading.Timer(self._batch_flush_delay, self._flush_batch_log)
self._batch_flush_timer.daemon = True
self._batch_flush_timer.start()
def _flush_batch_log(self):
    """Flush accumulated batch-store records as a single compact log line.

    Entries queued by ``store_ohlcv_data`` are grouped per symbol and
    emitted as one ``logger.info`` line, then the buffer is cleared.
    Safe to call with an empty buffer (no-op).

    Fix: the original only reset ``_flush_in_progress`` on the success
    path — if grouping or the logging call raised, the flag stayed True
    forever and every later flush returned early, permanently silencing
    batch logs and growing the buffer. State reset now lives in a
    ``finally`` block.
    """
    with self._batch_lock:
        if not self._batch_buffer or self._flush_in_progress:
            return
        self._flush_in_progress = True
        try:
            # Group buffered (timeframe, count, total) tuples by symbol
            # for a readable one-line summary.
            symbol_groups = {}
            for symbol, timeframe, count, total in self._batch_buffer:
                symbol_groups.setdefault(symbol, []).append((timeframe, count, total))

            parts = []
            for symbol in sorted(symbol_groups):
                tf_summary = ", ".join(
                    f"{timeframe}({count}, total: {total})"
                    for timeframe, count, total in sorted(symbol_groups[symbol])
                )
                parts.append(f"{symbol}: {tf_summary}")

            logger.info("Stored candles batch: " + " | ".join(parts))
        finally:
            # Always reset state so a logging error cannot wedge future flushes.
            self._batch_buffer.clear()
            self._flush_in_progress = False

    # Clear the timer reference after flushing; lock order (_batch_lock ->
    # _batch_timer_lock) is avoided here by releasing _batch_lock first.
    with self._batch_timer_lock:
        self._batch_flush_timer = None
def store_ohlcv_data(self, symbol: str, timeframe: str, df: pd.DataFrame) -> int: def store_ohlcv_data(self, symbol: str, timeframe: str, df: pd.DataFrame) -> int:
""" """
Store OHLCV data directly in DuckDB table Store OHLCV data directly in DuckDB table
@@ -177,7 +232,11 @@ class DuckDBStorage:
VALUES (?, ?, ?, ?, ?, ?, ?) VALUES (?, ?, ?, ?, ?, ?, ?)
""", (symbol, timeframe, '', first_ts, last_ts, count, now_ts)) """, (symbol, timeframe, '', first_ts, last_ts, count, now_ts))
logger.info(f"Stored {len(df)} candles for {symbol} {timeframe} in DuckDB (total: {count})") # Add to batch buffer instead of logging immediately
with self._batch_lock:
self._batch_buffer.append((symbol, timeframe, len(df), count))
self._schedule_batch_flush()
return len(df) return len(df)
except Exception as e: except Exception as e:
@@ -534,6 +593,14 @@ class DuckDBStorage:
def close(self):
    """Close database connection"""
    # Make sure the debounce timer cannot fire after shutdown.
    with self._batch_timer_lock:
        pending = self._batch_flush_timer
        if pending:
            pending.cancel()
    # Emit any batch log entries still waiting in the buffer.
    self._flush_batch_log()
    if self.conn:
        self.conn.close()
        logger.info("DuckDB connection closed")