Commit
·
952a097
1
Parent(s):
8baf463
Upload . with huggingface_hub
Browse files- .summary/0/events.out.tfevents.1678286079.qgallouedec-MS-7C84 +2 -2
- README.md +1 -1
- checkpoint_p0/best_000184960_94699520_reward_4719.047.pth +3 -0
- checkpoint_p0/checkpoint_000195208_99946496.pth +3 -0
- checkpoint_p0/checkpoint_000195328_100007936.pth +3 -0
- config.json +7 -5
- git.diff +0 -61
- replay.mp4 +2 -2
- sf_log.txt +0 -0
.summary/0/events.out.tfevents.1678286079.qgallouedec-MS-7C84
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:99cecd26758e5938e18fda367db078079b7867f0ebe0b1848c08776398a920d4
|
| 3 |
+
size 4964113
|
README.md
CHANGED
|
@@ -15,7 +15,7 @@ model-index:
|
|
| 15 |
type: hand-insert-v2
|
| 16 |
metrics:
|
| 17 |
- type: mean_reward
|
| 18 |
-
value:
|
| 19 |
name: mean_reward
|
| 20 |
verified: false
|
| 21 |
---
|
|
|
|
| 15 |
type: hand-insert-v2
|
| 16 |
metrics:
|
| 17 |
- type: mean_reward
|
| 18 |
+
value: 4295.54 +/- 1298.36
|
| 19 |
name: mean_reward
|
| 20 |
verified: false
|
| 21 |
---
|
checkpoint_p0/best_000184960_94699520_reward_4719.047.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68278cb6570af4eff04f454f5e06000abf938a6eaab3e9ed79bdc89174b389c4
|
| 3 |
+
size 98239
|
checkpoint_p0/checkpoint_000195208_99946496.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:944b1247942c821f9c02fe77c31227c45bcca5e81836d0023daf80070bf44779
|
| 3 |
+
size 98567
|
checkpoint_p0/checkpoint_000195328_100007936.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fdfda9847b96835f2b8ce3c1909e6cd9fbc0ad8b1e68fa5f931931d17f5340a9
|
| 3 |
+
size 98567
|
config.json
CHANGED
|
@@ -4,7 +4,7 @@
|
|
| 4 |
"env": "hand-insert-v2",
|
| 5 |
"experiment": "hand-insert-v2",
|
| 6 |
"train_dir": "/home/qgallouedec/gia/data/envs/metaworld/train_dir",
|
| 7 |
-
"restart_behavior": "
|
| 8 |
"device": "cpu",
|
| 9 |
"seed": null,
|
| 10 |
"num_policies": 1,
|
|
@@ -24,7 +24,7 @@
|
|
| 24 |
"recurrence": 1,
|
| 25 |
"shuffle_minibatches": false,
|
| 26 |
"gamma": 0.99,
|
| 27 |
-
"reward_scale": 0.
|
| 28 |
"reward_clip": 1000.0,
|
| 29 |
"value_bootstrap": true,
|
| 30 |
"normalize_returns": true,
|
|
@@ -120,15 +120,17 @@
|
|
| 120 |
"pbt_target_objective": "true_objective",
|
| 121 |
"pbt_perturb_min": 1.1,
|
| 122 |
"pbt_perturb_max": 1.5,
|
| 123 |
-
"command_line": "--env hand-insert-v2 --experiment hand-insert-v2 --with_wandb True --wandb_user qgallouedec --wandb_project sample_facotry_metaworld",
|
| 124 |
"cli_args": {
|
| 125 |
"env": "hand-insert-v2",
|
| 126 |
"experiment": "hand-insert-v2",
|
|
|
|
|
|
|
| 127 |
"with_wandb": true,
|
| 128 |
"wandb_user": "qgallouedec",
|
| 129 |
"wandb_project": "sample_facotry_metaworld"
|
| 130 |
},
|
| 131 |
-
"git_hash": "
|
| 132 |
"git_repo_name": "https://github.com/huggingface/gia",
|
| 133 |
-
"wandb_unique_id": "hand-insert-
|
| 134 |
}
|
|
|
|
| 4 |
"env": "hand-insert-v2",
|
| 5 |
"experiment": "hand-insert-v2",
|
| 6 |
"train_dir": "/home/qgallouedec/gia/data/envs/metaworld/train_dir",
|
| 7 |
+
"restart_behavior": "resume",
|
| 8 |
"device": "cpu",
|
| 9 |
"seed": null,
|
| 10 |
"num_policies": 1,
|
|
|
|
| 24 |
"recurrence": 1,
|
| 25 |
"shuffle_minibatches": false,
|
| 26 |
"gamma": 0.99,
|
| 27 |
+
"reward_scale": 0.01,
|
| 28 |
"reward_clip": 1000.0,
|
| 29 |
"value_bootstrap": true,
|
| 30 |
"normalize_returns": true,
|
|
|
|
| 120 |
"pbt_target_objective": "true_objective",
|
| 121 |
"pbt_perturb_min": 1.1,
|
| 122 |
"pbt_perturb_max": 1.5,
|
| 123 |
+
"command_line": "--env hand-insert-v2 --experiment hand-insert-v2 --with_wandb True --wandb_user qgallouedec --wandb_project sample_facotry_metaworld --train_for_env_steps 100000000 --reward_scale 0.01",
|
| 124 |
"cli_args": {
|
| 125 |
"env": "hand-insert-v2",
|
| 126 |
"experiment": "hand-insert-v2",
|
| 127 |
+
"reward_scale": 0.01,
|
| 128 |
+
"train_for_env_steps": 100000000,
|
| 129 |
"with_wandb": true,
|
| 130 |
"wandb_user": "qgallouedec",
|
| 131 |
"wandb_project": "sample_facotry_metaworld"
|
| 132 |
},
|
| 133 |
+
"git_hash": "44aa76c42f03edbe61877f2b20879ac5319e5842",
|
| 134 |
"git_repo_name": "https://github.com/huggingface/gia",
|
| 135 |
+
"wandb_unique_id": "hand-insert-v2_20230308_153436_728632"
|
| 136 |
}
|
git.diff
CHANGED
|
@@ -1,61 +0,0 @@
|
|
| 1 |
-
diff --git a/data/envs/metaworld/train_all.sh b/data/envs/metaworld/train_all.sh
|
| 2 |
-
index dbf328a..c412d01 100755
|
| 3 |
-
--- a/data/envs/metaworld/train_all.sh
|
| 4 |
-
+++ b/data/envs/metaworld/train_all.sh
|
| 5 |
-
@@ -1,28 +1,28 @@
|
| 6 |
-
#!/bin/bash
|
| 7 |
-
|
| 8 |
-
ENVS=(
|
| 9 |
-
- assembly
|
| 10 |
-
- basketball
|
| 11 |
-
- bin-picking
|
| 12 |
-
- box-close
|
| 13 |
-
- button-press-topdown
|
| 14 |
-
- button-press-topdown-wall
|
| 15 |
-
- button-press
|
| 16 |
-
- button-press-wall
|
| 17 |
-
- coffee-button
|
| 18 |
-
- coffee-pull
|
| 19 |
-
- coffee-push
|
| 20 |
-
- dial-turn
|
| 21 |
-
- disassemble
|
| 22 |
-
- door-close
|
| 23 |
-
- door-lock
|
| 24 |
-
- door-open
|
| 25 |
-
- door-unlock
|
| 26 |
-
- drawer-close
|
| 27 |
-
- drawer-open
|
| 28 |
-
- faucet-close
|
| 29 |
-
- faucet-open
|
| 30 |
-
- hammer
|
| 31 |
-
+ # assembly
|
| 32 |
-
+ # basketball
|
| 33 |
-
+ # bin-picking
|
| 34 |
-
+ # box-close
|
| 35 |
-
+ # button-press-topdown
|
| 36 |
-
+ # button-press-topdown-wall
|
| 37 |
-
+ # button-press
|
| 38 |
-
+ # button-press-wall
|
| 39 |
-
+ # coffee-button
|
| 40 |
-
+ # coffee-pull
|
| 41 |
-
+ # coffee-push
|
| 42 |
-
+ # dial-turn
|
| 43 |
-
+ # disassemble
|
| 44 |
-
+ # door-close
|
| 45 |
-
+ # door-lock
|
| 46 |
-
+ # door-open
|
| 47 |
-
+ # door-unlock
|
| 48 |
-
+ # drawer-close
|
| 49 |
-
+ # drawer-open
|
| 50 |
-
+ # faucet-close
|
| 51 |
-
+ # faucet-open
|
| 52 |
-
+ # hammer
|
| 53 |
-
hand-insert
|
| 54 |
-
handle-press-side
|
| 55 |
-
handle-press
|
| 56 |
-
@@ -55,4 +55,5 @@ ENVS=(
|
| 57 |
-
|
| 58 |
-
for ENV in "${ENVS[@]}"; do
|
| 59 |
-
python train.py --env $ENV-v2 --experiment $ENV-v2 --with_wandb True --wandb_user qgallouedec --wandb_project sample_facotry_metaworld
|
| 60 |
-
+ python enjoy.py --algo=APPO --env $ENV-v2 --experiment $ENV-v2 --train_dir=./train_dir --max_num_episodes=10 --push_to_hub --hf_repository=qgallouedec/sample-factory-$ENV-v2 --save_video --no_render --enjoy_script=enjoy --train_script=train --load_checkpoint_kind best
|
| 61 |
-
done
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
replay.mp4
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:87a1d832b52692f42e95a6859cf3363a2989963f4721106fe5a968db30eb90de
|
| 3 |
+
size 2016827
|
sf_log.txt
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|