qgallouedec HF Staff commited on
Commit
952a097
·
1 Parent(s): 8baf463

Upload . with huggingface_hub

Browse files
.summary/0/events.out.tfevents.1678286079.qgallouedec-MS-7C84 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69b89313cd1a881e17a47ff9388cb59a886a2aced9126dae7076d4f3b970673d
3
- size 1954598
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99cecd26758e5938e18fda367db078079b7867f0ebe0b1848c08776398a920d4
3
+ size 4964113
README.md CHANGED
@@ -15,7 +15,7 @@ model-index:
15
  type: hand-insert-v2
16
  metrics:
17
  - type: mean_reward
18
- value: 12.85 +/- 5.03
19
  name: mean_reward
20
  verified: false
21
  ---
 
15
  type: hand-insert-v2
16
  metrics:
17
  - type: mean_reward
18
+ value: 4295.54 +/- 1298.36
19
  name: mean_reward
20
  verified: false
21
  ---
checkpoint_p0/best_000184960_94699520_reward_4719.047.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68278cb6570af4eff04f454f5e06000abf938a6eaab3e9ed79bdc89174b389c4
3
+ size 98239
checkpoint_p0/checkpoint_000195208_99946496.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:944b1247942c821f9c02fe77c31227c45bcca5e81836d0023daf80070bf44779
3
+ size 98567
checkpoint_p0/checkpoint_000195328_100007936.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdfda9847b96835f2b8ce3c1909e6cd9fbc0ad8b1e68fa5f931931d17f5340a9
3
+ size 98567
config.json CHANGED
@@ -4,7 +4,7 @@
4
  "env": "hand-insert-v2",
5
  "experiment": "hand-insert-v2",
6
  "train_dir": "/home/qgallouedec/gia/data/envs/metaworld/train_dir",
7
- "restart_behavior": "restart",
8
  "device": "cpu",
9
  "seed": null,
10
  "num_policies": 1,
@@ -24,7 +24,7 @@
24
  "recurrence": 1,
25
  "shuffle_minibatches": false,
26
  "gamma": 0.99,
27
- "reward_scale": 0.1,
28
  "reward_clip": 1000.0,
29
  "value_bootstrap": true,
30
  "normalize_returns": true,
@@ -120,15 +120,17 @@
120
  "pbt_target_objective": "true_objective",
121
  "pbt_perturb_min": 1.1,
122
  "pbt_perturb_max": 1.5,
123
- "command_line": "--env hand-insert-v2 --experiment hand-insert-v2 --with_wandb True --wandb_user qgallouedec --wandb_project sample_facotry_metaworld",
124
  "cli_args": {
125
  "env": "hand-insert-v2",
126
  "experiment": "hand-insert-v2",
 
 
127
  "with_wandb": true,
128
  "wandb_user": "qgallouedec",
129
  "wandb_project": "sample_facotry_metaworld"
130
  },
131
- "git_hash": "2bb8d8c9cd813ffeafaad42038b1e71364092d36",
132
  "git_repo_name": "https://github.com/huggingface/gia",
133
- "wandb_unique_id": "hand-insert-v2_20230308_185042_269468"
134
  }
 
4
  "env": "hand-insert-v2",
5
  "experiment": "hand-insert-v2",
6
  "train_dir": "/home/qgallouedec/gia/data/envs/metaworld/train_dir",
7
+ "restart_behavior": "resume",
8
  "device": "cpu",
9
  "seed": null,
10
  "num_policies": 1,
 
24
  "recurrence": 1,
25
  "shuffle_minibatches": false,
26
  "gamma": 0.99,
27
+ "reward_scale": 0.01,
28
  "reward_clip": 1000.0,
29
  "value_bootstrap": true,
30
  "normalize_returns": true,
 
120
  "pbt_target_objective": "true_objective",
121
  "pbt_perturb_min": 1.1,
122
  "pbt_perturb_max": 1.5,
123
+ "command_line": "--env hand-insert-v2 --experiment hand-insert-v2 --with_wandb True --wandb_user qgallouedec --wandb_project sample_facotry_metaworld --train_for_env_steps 100000000 --reward_scale 0.01",
124
  "cli_args": {
125
  "env": "hand-insert-v2",
126
  "experiment": "hand-insert-v2",
127
+ "reward_scale": 0.01,
128
+ "train_for_env_steps": 100000000,
129
  "with_wandb": true,
130
  "wandb_user": "qgallouedec",
131
  "wandb_project": "sample_facotry_metaworld"
132
  },
133
+ "git_hash": "44aa76c42f03edbe61877f2b20879ac5319e5842",
134
  "git_repo_name": "https://github.com/huggingface/gia",
135
+ "wandb_unique_id": "hand-insert-v2_20230308_153436_728632"
136
  }
git.diff CHANGED
@@ -1,61 +0,0 @@
1
- diff --git a/data/envs/metaworld/train_all.sh b/data/envs/metaworld/train_all.sh
2
- index dbf328a..c412d01 100755
3
- --- a/data/envs/metaworld/train_all.sh
4
- +++ b/data/envs/metaworld/train_all.sh
5
- @@ -1,28 +1,28 @@
6
- #!/bin/bash
7
-
8
- ENVS=(
9
- - assembly
10
- - basketball
11
- - bin-picking
12
- - box-close
13
- - button-press-topdown
14
- - button-press-topdown-wall
15
- - button-press
16
- - button-press-wall
17
- - coffee-button
18
- - coffee-pull
19
- - coffee-push
20
- - dial-turn
21
- - disassemble
22
- - door-close
23
- - door-lock
24
- - door-open
25
- - door-unlock
26
- - drawer-close
27
- - drawer-open
28
- - faucet-close
29
- - faucet-open
30
- - hammer
31
- + # assembly
32
- + # basketball
33
- + # bin-picking
34
- + # box-close
35
- + # button-press-topdown
36
- + # button-press-topdown-wall
37
- + # button-press
38
- + # button-press-wall
39
- + # coffee-button
40
- + # coffee-pull
41
- + # coffee-push
42
- + # dial-turn
43
- + # disassemble
44
- + # door-close
45
- + # door-lock
46
- + # door-open
47
- + # door-unlock
48
- + # drawer-close
49
- + # drawer-open
50
- + # faucet-close
51
- + # faucet-open
52
- + # hammer
53
- hand-insert
54
- handle-press-side
55
- handle-press
56
- @@ -55,4 +55,5 @@ ENVS=(
57
-
58
- for ENV in "${ENVS[@]}"; do
59
- python train.py --env $ENV-v2 --experiment $ENV-v2 --with_wandb True --wandb_user qgallouedec --wandb_project sample_facotry_metaworld
60
- + python enjoy.py --algo=APPO --env $ENV-v2 --experiment $ENV-v2 --train_dir=./train_dir --max_num_episodes=10 --push_to_hub --hf_repository=qgallouedec/sample-factory-$ENV-v2 --save_video --no_render --enjoy_script=enjoy --train_script=train --load_checkpoint_kind best
61
- done
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f119d516d12805f1f08703d15334d766c9c035ea58e09cd30be4bf7cfe43e2f
3
- size 2668517
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87a1d832b52692f42e95a6859cf3363a2989963f4721106fe5a968db30eb90de
3
+ size 2016827
sf_log.txt CHANGED
The diff for this file is too large to render. See raw diff