Mr8bit committed on
Commit
e854013
·
verified ·
1 Parent(s): 69f3d8f

Upload folder using huggingface_hub

Browse files
Files changed (5) hide show
  1. config.json +82 -0
  2. critic.pth +3 -0
  3. critic_target.pth +3 -0
  4. log_alpha.pth +3 -0
  5. policy.pth +3 -0
config.json ADDED
@@ -0,0 +1,82 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "env": {
3
+ "name": "tensoraerospace.envs.b747_vec_torch.ImprovedB747VecEnvTorch",
4
+ "params": {
5
+ "num_envs": 128,
6
+ "dt": 0.1,
7
+ "tn": 20.0,
8
+ "initial_state": [
9
+ 0.0,
10
+ 0.0,
11
+ 0.0,
12
+ 0.0
13
+ ],
14
+ "device": "mps",
15
+ "seed": 0,
16
+ "auto_reset": true,
17
+ "include_reference_in_obs": true,
18
+ "step_randomization": {
19
+ "signal_type": "step",
20
+ "amplitude_deg_range": [
21
+ -5.0,
22
+ 5.0
23
+ ],
24
+ "min_abs_amplitude_deg": 0.1,
25
+ "step_time_sec_range": [
26
+ 1,
27
+ 15
28
+ ],
29
+ "frequency_hz_range": [
30
+ 0.02,
31
+ 0.1
32
+ ],
33
+ "p_step": 0.5,
34
+ "p_sine": 0.3,
35
+ "ref_change_threshold_rad": 0.0017453292519943296,
36
+ "min_step_amp_rad": 0.008726646259971648
37
+ },
38
+ "reward_mode": "tracking",
39
+ "survival_bonus": 0.0,
40
+ "completion_bonus": 0.0,
41
+ "early_termination_penalty": 0.0,
42
+ "early_termination_penalty_per_step": 0.0
43
+ }
44
+ },
45
+ "policy": {
46
+ "name": "tensoraerospace.agent.dsac.dsac_flight.DSAC",
47
+ "params": {
48
+ "gamma": 0.995,
49
+ "tau": 0.005,
50
+ "alpha": 0.03246142342686653,
51
+ "updates_per_step": 4,
52
+ "target_update_interval": 1,
53
+ "batch_size": 256,
54
+ "automatic_entropy_tuning": true,
55
+ "target_entropy_scale": 1.0,
56
+ "min_alpha": 0.0,
57
+ "exploration_noise_std": 0.0,
58
+ "reward_clip": 20.0,
59
+ "num_quantiles": 8,
60
+ "num_quantiles_exp": 8,
61
+ "embedding_dim": 64,
62
+ "hidden_layers": [
63
+ 64,
64
+ 64
65
+ ],
66
+ "huber_threshold": 1.0,
67
+ "learning_starts": 100000,
68
+ "warmup_action_scale": 1.0,
69
+ "caps_lambda_smoothness": 0.0,
70
+ "caps_lambda_temporal": 0.0,
71
+ "caps_noise_std": 0.05,
72
+ "risk_distortion": "neutral",
73
+ "risk_measure": 1.0,
74
+ "device": "mps",
75
+ "lr": 0.00044,
76
+ "policy_lr": 0.00044,
77
+ "log_every_updates": 200,
78
+ "seed": 0,
79
+ "log_dir": "runs/dsac_b747_step_response_20260106_021709"
80
+ }
81
+ }
82
+ }
critic.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85d869d815cff0f700934b671dc12d9f96e9696c15a73c0305d8bcfd46089ec8
3
+ size 153405
critic_target.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d26b1cbd57ac3f6d9ab64504afa117362c2cc18a03525675301d161d5521d0d
3
+ size 156159
log_alpha.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f7d38a0f3e2a7a86c451563ed5bec3abaa5ea762e5ec4734a26b4d1b1210cc2
3
+ size 1591
policy.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:799e5d023345ca19c8f290d4f84024abcc72d2331d28ce2b7d4a6bd9584f5792
3
+ size 58333