File size: 1,060 Bytes
# LILITH-Base Configuration
# ~150M parameters, balanced performance
# Model architecture settings.
# Every key below is nested under `model:`. Left at column 0, `model:` would
# parse as null and these settings would become unrelated top-level keys.
# NOTE(review): nesting is reconstructed from the section headers; confirm the
# loader reads these as config["model"][...].
model:
  variant: base
  hidden_dim: 256
  num_heads: 8  # 256 / 8 = 32; presumably the per-head width (TODO confirm)
  ffn_dim: 1024  # 4 x hidden_dim

  # Input/Output
  input_features: 7
  output_features: 3
  sequence_length: 30
  forecast_length: 90

  # Component depths
  gat_layers: 3
  temporal_layers: 6
  sfno_layers: 4

  # Grid configuration
  use_grid: true
  nlat: 64
  nlon: 128  # 2 x nlat

  # Features
  use_climate_embed: true
  use_solar_position: true
  use_flash_attention: true
  use_rope: true

  # Ensemble
  ensemble_method: gaussian
  ensemble_members: 10

  # Regularization
  dropout: 0.1

  # Memory optimization
  gradient_checkpointing: true
# Training / optimizer settings.
# Keys are nested under `training:` so that `batch_size` here does not collide
# with the `batch_size` used for inference.
# NOTE(review): nesting is reconstructed from the section headers; confirm the
# loader reads these as config["training"][...].
training:
  # Written with an explicit decimal point on purpose: YAML 1.1 loaders (e.g.
  # PyYAML) resolve a bare `1e-4` to the *string* "1e-4", not a float.
  learning_rate: 1.0e-4
  weight_decay: 0.01
  max_grad_norm: 1.0
  warmup_steps: 1000
  max_steps: 100000

  # 8 x 4 = 32; presumably the effective batch per optimizer step
  # (TODO confirm against the training loop).
  batch_size: 8
  gradient_accumulation_steps: 4

  # Mixed precision
  use_amp: true
  amp_dtype: float16

  # Curriculum: five stages with four switch points.
  # NOTE(review): presumably switch step i moves from stage i to stage i+1, and
  # all switches must fall before max_steps — verify against the consumer.
  curriculum_enabled: true
  curriculum_stages: [7, 14, 30, 60, 90]
  curriculum_switch_steps: [10000, 30000, 60000, 80000]
# Inference-time settings.
# Keys are nested under `inference:` so that this `batch_size` stays separate
# from the training `batch_size` rather than duplicating it as a top-level key.
# NOTE(review): nesting is reconstructed from the section headers; confirm the
# loader reads these as config["inference"][...].
inference:
  # NOTE(review): presumably selects dynamic INT8 quantization — confirm the
  # set of values the loader accepts.
  quantization: dynamic_int8
  batch_size: 16
  max_stations: 200
|