amewebstudio committed on
Commit
11a906a
·
verified ·
1 Parent(s): adc8731

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +121 -0
config.json ADDED
@@ -0,0 +1,121 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "2.0",
3
+ "codename": "WorldSim-Cognitive",
4
+ "d_model": 512,
5
+ "d_ff": 2048,
6
+ "n_layers": 8,
7
+ "n_heads": 8,
8
+ "dropout": 0.1,
9
+ "latent_dim": 256,
10
+ "latent_state_dim": 256,
11
+ "action_dim": 5,
12
+ "max_seq_len": 512,
13
+ "context_length": 16,
14
+ "prediction_horizon": 8,
15
+ "encoder_channels": [
16
+ 32,
17
+ 64,
18
+ 128,
19
+ 256
20
+ ],
21
+ "decoder_channels": [
22
+ 256,
23
+ 128,
24
+ 64,
25
+ 32
26
+ ],
27
+ "kl_weight": 0.0001,
28
+ "use_lpol": true,
29
+ "memory_size": 512,
30
+ "memory_k": 8,
31
+ "domain_types": [
32
+ "physics",
33
+ "spatial",
34
+ "temporal",
35
+ "causal",
36
+ "agent",
37
+ "object",
38
+ "zone",
39
+ "action",
40
+ "reward"
41
+ ],
42
+ "use_gqa": true,
43
+ "gqa_num_heads": 8,
44
+ "gqa_num_kv_groups": 2,
45
+ "multi_scale_enabled": true,
46
+ "st_decay": 0.9,
47
+ "lt_decay": 0.99,
48
+ "episodic_size": 256,
49
+ "episodic_dim": 128,
50
+ "structural_dim": 64,
51
+ "structural_decay": 0.95,
52
+ "expert_types": [
53
+ "Physics",
54
+ "Spatial",
55
+ "Temporal",
56
+ "Causal",
57
+ "Prediction",
58
+ "Planning"
59
+ ],
60
+ "max_experts": 12,
61
+ "growth_threshold_coherence": 0.3,
62
+ "growth_patience": 10,
63
+ "neurogenesis_enabled": true,
64
+ "min_neurons_per_layer": 32,
65
+ "max_neurons_per_layer": 256,
66
+ "neuron_birth_threshold": 0.8,
67
+ "neuron_death_threshold": 0.05,
68
+ "energy_cost_think": 0.02,
69
+ "energy_cost_dream": 0.1,
70
+ "energy_regeneration": 0.05,
71
+ "dream_enabled": true,
72
+ "dream_cycle_length": 50,
73
+ "dream_duration": 10,
74
+ "prioritized_replay": true,
75
+ "internal_state_dim": 128,
76
+ "tension_integration_rate": 0.1,
77
+ "world_state_dim": 128,
78
+ "world_update_rate": 0.1,
79
+ "world_domains": [
80
+ "physical",
81
+ "social",
82
+ "abstract",
83
+ "temporal"
84
+ ],
85
+ "physics_components": 8,
86
+ "physics_hidden": 256,
87
+ "batch_size": 32,
88
+ "learning_rate": 0.0001,
89
+ "epochs": 6,
90
+ "push_to_hub": true,
91
+ "hub_model_id": "amewebstudio/nexus-worldmodel-v2",
92
+ "world": {
93
+ "width": 64,
94
+ "height": 64,
95
+ "channels": 3,
96
+ "gravity": 0.1,
97
+ "friction": 0.98,
98
+ "bounce": 0.8,
99
+ "max_velocity": 5.0,
100
+ "max_agents": 5,
101
+ "max_obstacles": 10,
102
+ "max_zones": 3,
103
+ "agent_radius": 2.0,
104
+ "dt": 1.0
105
+ },
106
+ "_name_or_path": "amewebstudio/nexus-worldmodel-v2",
107
+ "architectures": [
108
+ "NexusWorldModel"
109
+ ],
110
+ "model_type": "nexus-worldmodel",
111
+ "auto_map": {
112
+ "AutoModel": "modeling_nexus_worldmodel.NexusWorldModel",
113
+ "AutoConfig": "configuration_nexus_worldmodel.NexusWorldModelConfig"
114
+ },
115
+ "training_info": {
116
+ "epochs": 6,
117
+ "final_loss": 0.01724659317859717,
118
+ "neurogenesis_events": 0,
119
+ "parameters": 227991690
120
+ }
121
+ }