Beef up the transformer (T) model

This commit is contained in:
Dobromir Popov
2025-07-02 01:26:07 +03:00
parent 0c8ae823ba
commit 8645f6e8dd
3 changed files with 156 additions and 75 deletions

View File

@ -239,14 +239,17 @@ class CleanTradingDashboard:
from NN.models.advanced_transformer_trading import create_trading_transformer, TradingTransformerConfig
config = TradingTransformerConfig(
d_model=256,
n_heads=8,
n_layers=4,
seq_len=50,
d_model=1024, # 4x increase (256 -> 1024) for 46M parameters
n_heads=16, # 2x increase (8 -> 16)
n_layers=12, # 3x increase (4 -> 12)
seq_len=150, # 3x increase (50 -> 150)
n_actions=3,
use_multi_scale_attention=True,
use_market_regime_detection=True,
use_uncertainty_estimation=True
use_uncertainty_estimation=True,
use_deep_attention=True,
use_residual_connections=True,
use_layer_norm_variants=True
)
model, trainer = create_trading_transformer(config)
@ -4600,14 +4603,17 @@ class CleanTradingDashboard:
# Create transformer if not exists
if transformer_model is None or transformer_trainer is None:
config = TradingTransformerConfig(
d_model=256,
n_heads=8,
n_layers=4,
seq_len=50,
d_model=1024, # 4x increase (256 -> 1024) for 46M parameters
n_heads=16, # 2x increase (8 -> 16)
n_layers=12, # 3x increase (4 -> 12)
seq_len=150, # 3x increase (50 -> 150)
n_actions=3,
use_multi_scale_attention=True,
use_market_regime_detection=True,
use_uncertainty_estimation=True
use_uncertainty_estimation=True,
use_deep_attention=True,
use_residual_connections=True,
use_layer_norm_variants=True
)
transformer_model, transformer_trainer = create_trading_transformer(config)