# LILITH-Tiny Configuration
# ~50M parameters, suitable for RTX 3060 inference
model:
  # All keys below are nested under `model` so they load as one mapping
  # instead of as unrelated top-level keys.
  variant: tiny
  hidden_dim: 128
  num_heads: 4
  # 4 x hidden_dim.
  ffn_dim: 512

  # Input/Output
  input_features: 7
  output_features: 3
  sequence_length: 30
  forecast_length: 90

  # Component depths
  gat_layers: 2
  temporal_layers: 4
  sfno_layers: 2

  # Grid configuration
  # NOTE(review): nlat/nlon presumably give the grid resolution and only
  # matter when use_grid is true - confirm against the model code.
  use_grid: true
  nlat: 32
  nlon: 64

  # Features
  use_climate_embed: true
  use_solar_position: true
  use_flash_attention: true
  use_rope: true

  # Ensemble
  ensemble_method: gaussian
  ensemble_members: 10

  # Regularization
  dropout: 0.1

  # Memory optimization
  gradient_checkpointing: false
training:
  # Written with a decimal point so YAML 1.1 loaders (e.g. PyYAML) resolve
  # it as a float; a bare `2e-4` is loaded as the string "2e-4" there.
  learning_rate: 2.0e-4
  weight_decay: 0.01
  max_grad_norm: 1.0
  warmup_steps: 500
  max_steps: 50000

  # Nested under `training` so this key cannot collide with any other
  # `batch_size` key in the file.
  batch_size: 16
  gradient_accumulation_steps: 2

  use_amp: true
  amp_dtype: float16

  # Five stages but four switch steps.
  # NOTE(review): presumably each switch step marks the move to the next
  # stage - confirm against the trainer.
  curriculum_enabled: true
  curriculum_stages: [7, 14, 30, 60, 90]
  curriculum_switch_steps: [5000, 15000, 30000, 40000]
inference:
  quantization: dynamic_int8
  # Nested under `inference` so this key cannot collide with any other
  # `batch_size` key in the file.
  batch_size: 32
  max_stations: 100