qgallouedec HF Staff committed on
Commit
8baf463
·
1 Parent(s): c48a56a

Upload . with huggingface_hub

Browse files
.summary/0/events.out.tfevents.1678297845.qgallouedec-MS-7C84 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2836d6f83bdd97fb224a50435a46023ef41f74e3c711cce678b3e2d48e325b7d
3
+ size 67266
README.md CHANGED
@@ -15,7 +15,7 @@ model-index:
15
  type: hand-insert-v2
16
  metrics:
17
  - type: mean_reward
18
- value: 2267.66 +/- 2222.12
19
  name: mean_reward
20
  verified: false
21
  ---
 
15
  type: hand-insert-v2
16
  metrics:
17
  - type: mean_reward
18
+ value: 12.85 +/- 5.03
19
  name: mean_reward
20
  verified: false
21
  ---
checkpoint_p0/best_000000224_114688_reward_147.069.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33e5942b92ad2a181416b6b51e681802b3057bcd32c79d3dd30a12706d398ff3
3
+ size 98239
checkpoint_p0/checkpoint_000000456_233472.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20fed33ec75095ab20b7ac281215c7a1dca17ab295b893b99dddbdbcb4d26673
3
+ size 98567
checkpoint_p0/checkpoint_000000696_356352.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d5ccf9a64aedfb8fc1d7e46638d7ce2e804d143f6e3c4e5162e37185f881793
3
+ size 98567
config.json CHANGED
@@ -4,7 +4,7 @@
4
  "env": "hand-insert-v2",
5
  "experiment": "hand-insert-v2",
6
  "train_dir": "/home/qgallouedec/gia/data/envs/metaworld/train_dir",
7
- "restart_behavior": "resume",
8
  "device": "cpu",
9
  "seed": null,
10
  "num_policies": 1,
@@ -24,7 +24,7 @@
24
  "recurrence": 1,
25
  "shuffle_minibatches": false,
26
  "gamma": 0.99,
27
- "reward_scale": 0.01,
28
  "reward_clip": 1000.0,
29
  "value_bootstrap": true,
30
  "normalize_returns": true,
@@ -120,17 +120,15 @@
120
  "pbt_target_objective": "true_objective",
121
  "pbt_perturb_min": 1.1,
122
  "pbt_perturb_max": 1.5,
123
- "command_line": "--env hand-insert-v2 --experiment hand-insert-v2 --with_wandb True --wandb_user qgallouedec --wandb_project sample_facotry_metaworld --train_for_env_steps 100000000 --reward_scale 0.01",
124
  "cli_args": {
125
  "env": "hand-insert-v2",
126
  "experiment": "hand-insert-v2",
127
- "reward_scale": 0.01,
128
- "train_for_env_steps": 100000000,
129
  "with_wandb": true,
130
  "wandb_user": "qgallouedec",
131
  "wandb_project": "sample_facotry_metaworld"
132
  },
133
- "git_hash": "44aa76c42f03edbe61877f2b20879ac5319e5842",
134
  "git_repo_name": "https://github.com/huggingface/gia",
135
- "wandb_unique_id": "hand-insert-v2_20230308_153436_728632"
136
  }
 
4
  "env": "hand-insert-v2",
5
  "experiment": "hand-insert-v2",
6
  "train_dir": "/home/qgallouedec/gia/data/envs/metaworld/train_dir",
7
+ "restart_behavior": "restart",
8
  "device": "cpu",
9
  "seed": null,
10
  "num_policies": 1,
 
24
  "recurrence": 1,
25
  "shuffle_minibatches": false,
26
  "gamma": 0.99,
27
+ "reward_scale": 0.1,
28
  "reward_clip": 1000.0,
29
  "value_bootstrap": true,
30
  "normalize_returns": true,
 
120
  "pbt_target_objective": "true_objective",
121
  "pbt_perturb_min": 1.1,
122
  "pbt_perturb_max": 1.5,
123
+ "command_line": "--env hand-insert-v2 --experiment hand-insert-v2 --with_wandb True --wandb_user qgallouedec --wandb_project sample_facotry_metaworld",
124
  "cli_args": {
125
  "env": "hand-insert-v2",
126
  "experiment": "hand-insert-v2",
 
 
127
  "with_wandb": true,
128
  "wandb_user": "qgallouedec",
129
  "wandb_project": "sample_facotry_metaworld"
130
  },
131
+ "git_hash": "2bb8d8c9cd813ffeafaad42038b1e71364092d36",
132
  "git_repo_name": "https://github.com/huggingface/gia",
133
+ "wandb_unique_id": "hand-insert-v2_20230308_185042_269468"
134
  }
git.diff CHANGED
@@ -0,0 +1,61 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ diff --git a/data/envs/metaworld/train_all.sh b/data/envs/metaworld/train_all.sh
2
+ index dbf328a..c412d01 100755
3
+ --- a/data/envs/metaworld/train_all.sh
4
+ +++ b/data/envs/metaworld/train_all.sh
5
+ @@ -1,28 +1,28 @@
6
+ #!/bin/bash
7
+
8
+ ENVS=(
9
+ - assembly
10
+ - basketball
11
+ - bin-picking
12
+ - box-close
13
+ - button-press-topdown
14
+ - button-press-topdown-wall
15
+ - button-press
16
+ - button-press-wall
17
+ - coffee-button
18
+ - coffee-pull
19
+ - coffee-push
20
+ - dial-turn
21
+ - disassemble
22
+ - door-close
23
+ - door-lock
24
+ - door-open
25
+ - door-unlock
26
+ - drawer-close
27
+ - drawer-open
28
+ - faucet-close
29
+ - faucet-open
30
+ - hammer
31
+ + # assembly
32
+ + # basketball
33
+ + # bin-picking
34
+ + # box-close
35
+ + # button-press-topdown
36
+ + # button-press-topdown-wall
37
+ + # button-press
38
+ + # button-press-wall
39
+ + # coffee-button
40
+ + # coffee-pull
41
+ + # coffee-push
42
+ + # dial-turn
43
+ + # disassemble
44
+ + # door-close
45
+ + # door-lock
46
+ + # door-open
47
+ + # door-unlock
48
+ + # drawer-close
49
+ + # drawer-open
50
+ + # faucet-close
51
+ + # faucet-open
52
+ + # hammer
53
+ hand-insert
54
+ handle-press-side
55
+ handle-press
56
+ @@ -55,4 +55,5 @@ ENVS=(
57
+
58
+ for ENV in "${ENVS[@]}"; do
59
+ python train.py --env $ENV-v2 --experiment $ENV-v2 --with_wandb True --wandb_user qgallouedec --wandb_project sample_facotry_metaworld
60
+ + python enjoy.py --algo=APPO --env $ENV-v2 --experiment $ENV-v2 --train_dir=./train_dir --max_num_episodes=10 --push_to_hub --hf_repository=qgallouedec/sample-factory-$ENV-v2 --save_video --no_render --enjoy_script=enjoy --train_script=train --load_checkpoint_kind best
61
+ done
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b92a870963b0ae5689f23bcdc7107c9f09bf93f252cada23fae29eb71648fa93
3
- size 2182118
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f119d516d12805f1f08703d15334d766c9c035ea58e09cd30be4bf7cfe43e2f
3
+ size 2668517
sf_log.txt CHANGED
The diff for this file is too large to render. See raw diff