qgallouedec HF Staff commited on
Commit
87ddc26
·
1 Parent(s): 78b24cd

Upload folder using huggingface_hub

Browse files
.summary/0/events.out.tfevents.1689616460.qgallouedec-MS-7C84 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c14ac072b47f163b9b40b9943ca0d04070cd968546cfdcd55b958b3c95ec2bce
3
+ size 700314
README.md CHANGED
@@ -15,7 +15,7 @@ model-index:
15
  type: bin-picking-v2
16
  metrics:
17
  - type: mean_reward
18
- value: 61.02 +/- 36.03
19
  name: mean_reward
20
  verified: false
21
  ---
 
15
  type: bin-picking-v2
16
  metrics:
17
  - type: mean_reward
18
+ value: 452.37 +/- 36.53
19
  name: mean_reward
20
  verified: false
21
  ---
checkpoint_p0/best_000019264_9863168_reward_428.167.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79f5623aadf2391036a6b0375de622dcbf299d8bf7f1e8f7a45875552255db93
3
+ size 98239
checkpoint_p0/checkpoint_000019472_9969664.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5bdba43d6c84fa46e0458b9f3ff3669f02f85381a0208c6f097e08900f02fa2
3
+ size 98567
checkpoint_p0/checkpoint_000019544_10006528.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e95491e121d7872b3757d667aee9955960d19ada63238ec94b4cade1bc05f64
3
  size 98567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e3659821692b5baebd00d6b39e856f2434f8c4c6c796d8da43a5eb80c302359
3
  size 98567
config.json CHANGED
@@ -128,7 +128,7 @@
128
  "wandb_user": "qgallouedec",
129
  "wandb_project": "sample_facotry_metaworld"
130
  },
131
- "git_hash": "66db1b7a27030aa65fcfa2d6e3503089a7cff207",
132
  "git_repo_name": "https://github.com/huggingface/gia",
133
- "wandb_unique_id": "bin-picking-v2_20230708_124717_514721"
134
  }
 
128
  "wandb_user": "qgallouedec",
129
  "wandb_project": "sample_facotry_metaworld"
130
  },
131
+ "git_hash": "952d4a00946fa97ee3267d32a2160be9933e887a",
132
  "git_repo_name": "https://github.com/huggingface/gia",
133
+ "wandb_unique_id": "bin-picking-v2_20230717_195418_651812"
134
  }
git.diff CHANGED
@@ -1,3 +1,140 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  diff --git a/gia/eval/callback.py b/gia/eval/callback.py
2
  index 5c3a080..4b6198f 100644
3
  --- a/gia/eval/callback.py
@@ -14,70 +151,21 @@ index 5c3a080..4b6198f 100644
14
  from gia.config import Arguments
15
  from gia.eval.utils import is_slurm_available
16
 
17
- diff --git a/gia/eval/evaluator.py b/gia/eval/evaluator.py
18
- index 91b645c..3e2cae7 100644
19
- --- a/gia/eval/evaluator.py
20
- +++ b/gia/eval/evaluator.py
21
- @@ -1,3 +1,5 @@
22
- +from typing import Optional
23
- +
24
- import torch
25
-
26
- from gia.config.arguments import Arguments
27
- @@ -5,11 +7,12 @@ from gia.model import GiaModel
28
-
29
-
30
- class Evaluator:
31
- - def __init__(self, args: Arguments, task: str) -> None:
32
- + def __init__(self, args: Arguments, task: str, mean_random: Optional[float] = None) -> None:
33
- self.args = args
34
- self.task = task
35
- + self.mean_random = mean_random
36
-
37
- - @torch.no_grad()
38
- + @torch.inference_mode()
39
- def evaluate(self, model: GiaModel) -> float:
40
- return self._evaluate(model)
41
-
42
- diff --git a/gia/eval/rl/envs/core.py b/gia/eval/rl/envs/core.py
43
- index ec5e5b2..eeaf7cb 100644
44
- --- a/gia/eval/rl/envs/core.py
45
- +++ b/gia/eval/rl/envs/core.py
46
- @@ -177,7 +177,6 @@ def make(task_name: str, num_envs: int = 1):
47
-
48
- elif task_name.startswith("metaworld"):
49
- import gymnasium as gym
50
- - import metaworld
51
-
52
- env_id = TASK_TO_ENV_MAPPING[task_name]
53
- env = gym.vector.SyncVectorEnv([lambda: gym.make(env_id)] * num_envs)
54
  diff --git a/gia/eval/rl/gia_agent.py b/gia/eval/rl/gia_agent.py
55
- index f0d0b9b..39dc0d2 100644
56
  --- a/gia/eval/rl/gia_agent.py
57
  +++ b/gia/eval/rl/gia_agent.py
58
- @@ -54,7 +54,7 @@ class GiaAgent:
59
- self.action_space = action_space
60
- self.deterministic = deterministic
61
- self.device = next(model.parameters()).device
62
- - self._max_length = self.model.config.max_position_embeddings - 10
63
- + self._max_length = self.model.config.max_position_embeddings - 100 # TODO: fix this
64
-
65
- if isinstance(observation_space, spaces.Box):
66
- self._observation_key = "continuous_observations"
67
- @@ -75,6 +75,11 @@ class GiaAgent:
68
- ) -> Tuple[Tuple[Tensor, Tensor], ...]:
69
- return tuple((k[:, :, -self._max_length :], v[:, :, -self._max_length :]) for (k, v) in past_key_values)
70
-
71
- + def set_model(self, model: GiaModel) -> None:
72
- + self.model = model
73
- + self.device = next(model.parameters()).device
74
- + self._max_length = self.model.config.max_position_embeddings
75
- +
76
- def reset(self, num_envs: int = 1) -> None:
77
- if self.prompter is not None:
78
- prompts = self.prompter.generate_prompts(num_envs)
79
  diff --git a/gia/eval/rl/gym_evaluator.py b/gia/eval/rl/gym_evaluator.py
80
- index f8531ee..754c05d 100644
81
  --- a/gia/eval/rl/gym_evaluator.py
82
  +++ b/gia/eval/rl/gym_evaluator.py
83
  @@ -1,7 +1,7 @@
@@ -85,37 +173,7 @@ index f8531ee..754c05d 100644
85
  from gym.vector.vector_env import VectorEnv
86
 
87
  -from gia.eval.mappings import TASK_TO_ENV_MAPPING
88
- +# from gia.eval.rl.envs.mappings import TASK_TO_ENV_MAPPING
89
  from gia.eval.rl.rl_evaluator import RLEvaluator
90
 
91
 
92
- diff --git a/gia/eval/rl/rl_evaluator.py b/gia/eval/rl/rl_evaluator.py
93
- index c5cc423..91189f3 100644
94
- --- a/gia/eval/rl/rl_evaluator.py
95
- +++ b/gia/eval/rl/rl_evaluator.py
96
- @@ -8,6 +8,10 @@ from gia.eval.rl.gia_agent import GiaAgent
97
-
98
-
99
- class RLEvaluator(Evaluator):
100
- + def __init__(self, args, task):
101
- + super().__init__(args, task)
102
- + self.agent = GiaAgent()
103
- +
104
- def _build_env(self) -> VectorEnv: # TODO: maybe just a gym.Env ?
105
- raise NotImplementedError
106
-
107
- diff --git a/gia/eval/rl/scores_dict.json b/gia/eval/rl/scores_dict.json
108
- index 1b8ebee..ff7d030 100644
109
- --- a/gia/eval/rl/scores_dict.json
110
- +++ b/gia/eval/rl/scores_dict.json
111
- @@ -929,8 +929,8 @@
112
- },
113
- "metaworld-assembly": {
114
- "expert": {
115
- - "mean": 311.29314618777823,
116
- - "std": 75.04282151450695
117
- + "mean": 3523.81468486244,
118
- + "std": 63.22745220327798
119
- },
120
- "random": {
121
- "mean": 220.65601680730813,
 
1
+ diff --git a/data/envs/metaworld/generate_dataset_all.sh b/data/envs/metaworld/generate_dataset_all.sh
2
+ index acfe879..0185b2b 100755
3
+ --- a/data/envs/metaworld/generate_dataset_all.sh
4
+ +++ b/data/envs/metaworld/generate_dataset_all.sh
5
+ @@ -2,8 +2,6 @@
6
+
7
+ ENVS=(
8
+ assembly
9
+ - basketball
10
+ - bin-picking
11
+ box-close
12
+ button-press-topdown
13
+ button-press-topdown-wall
14
+ @@ -11,9 +9,7 @@ ENVS=(
15
+ button-press-wall
16
+ coffee-button
17
+ coffee-pull
18
+ - coffee-push
19
+ dial-turn
20
+ - disassemble
21
+ door-close
22
+ door-lock
23
+ door-open
24
+ @@ -22,29 +18,15 @@ ENVS=(
25
+ drawer-open
26
+ faucet-close
27
+ faucet-open
28
+ - hammer
29
+ hand-insert
30
+ handle-press-side
31
+ handle-press
32
+ handle-pull-side
33
+ handle-pull
34
+ lever-pull
35
+ - peg-insert-side
36
+ - peg-unplug-side
37
+ - pick-out-of-hole
38
+ - pick-place
39
+ - pick-place-wall
40
+ - plate-slide-back-side
41
+ - plate-slide-back
42
+ - plate-slide-side
43
+ - plate-slide
44
+ push-back
45
+ push
46
+ push-wall
47
+ - reach
48
+ - reach-wall
49
+ - shelf-place
50
+ - soccer
51
+ stick-pull
52
+ stick-push
53
+ sweep-into
54
+ @@ -54,6 +36,6 @@ ENVS=(
55
+ )
56
+
57
+ for ENV in "${ENVS[@]}"; do
58
+ - python -m sample_factory.huggingface.load_from_hub -r qgallouedec/$ENV-v2
59
+ + # python -m sample_factory.huggingface.load_from_hub -r qgallouedec/$ENV-v2
60
+ python generate_dataset.py --env $ENV-v2 --experiment $ENV-v2 --train_dir=./train_dir
61
+ done
62
+ diff --git a/data/envs/metaworld/train_all.sh b/data/envs/metaworld/train_all.sh
63
+ index dbf328a..166ccb8 100755
64
+ --- a/data/envs/metaworld/train_all.sh
65
+ +++ b/data/envs/metaworld/train_all.sh
66
+ @@ -1,56 +1,10 @@
67
+ #!/bin/bash
68
+
69
+ ENVS=(
70
+ - assembly
71
+ - basketball
72
+ bin-picking
73
+ - box-close
74
+ - button-press-topdown
75
+ - button-press-topdown-wall
76
+ - button-press
77
+ - button-press-wall
78
+ - coffee-button
79
+ - coffee-pull
80
+ - coffee-push
81
+ - dial-turn
82
+ disassemble
83
+ - door-close
84
+ - door-lock
85
+ - door-open
86
+ - door-unlock
87
+ - drawer-close
88
+ - drawer-open
89
+ - faucet-close
90
+ - faucet-open
91
+ - hammer
92
+ - hand-insert
93
+ - handle-press-side
94
+ - handle-press
95
+ - handle-pull-side
96
+ - handle-pull
97
+ - lever-pull
98
+ peg-insert-side
99
+ - peg-unplug-side
100
+ - pick-out-of-hole
101
+ - pick-place
102
+ pick-place-wall
103
+ - plate-slide-back-side
104
+ - plate-slide-back
105
+ - plate-slide-side
106
+ - plate-slide
107
+ - push-back
108
+ - push
109
+ - push-wall
110
+ - reach
111
+ - reach-wall
112
+ - shelf-place
113
+ - soccer
114
+ - stick-pull
115
+ - stick-push
116
+ - sweep-into
117
+ - sweep
118
+ - window-close
119
+ - window-open
120
+ )
121
+
122
+ for ENV in "${ENVS[@]}"; do
123
+ diff --git a/data/envs/mujoco/create_mujoco_dataset.sh b/data/envs/mujoco/create_mujoco_dataset.sh
124
+ old mode 100644
125
+ new mode 100755
126
+ index d8ce6d6..c4dfebb
127
+ --- a/data/envs/mujoco/create_mujoco_dataset.sh
128
+ +++ b/data/envs/mujoco/create_mujoco_dataset.sh
129
+ @@ -2,7 +2,7 @@
130
+ # creates 100,000 per environment from models hosted on the hub
131
+
132
+ ENVS=(
133
+ - ant halfcheetah hopper doublependulum pendulum reacher swimmer walker
134
+ + ant
135
+ )
136
+
137
+ for ENV in "${ENVS[@]}"; do
138
  diff --git a/gia/eval/callback.py b/gia/eval/callback.py
139
  index 5c3a080..4b6198f 100644
140
  --- a/gia/eval/callback.py
 
151
  from gia.config import Arguments
152
  from gia.eval.utils import is_slurm_available
153
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
154
  diff --git a/gia/eval/rl/gia_agent.py b/gia/eval/rl/gia_agent.py
155
+ index af6d86e..f6098d4 100644
156
  --- a/gia/eval/rl/gia_agent.py
157
  +++ b/gia/eval/rl/gia_agent.py
158
+ @@ -94,7 +94,7 @@ class GiaAgent:
159
+ elif isinstance(self.observation_space, spaces.MultiDiscrete):
160
+ self._observation_key = "discrete_observations"
161
+ else:
162
+ - raise TypeError("Unsupported observation space")
163
+ + print("Unsupported observation space")
164
+
165
+ if isinstance(self.action_space, spaces.Box):
166
+ self._num_act_tokens = self.action_space.shape[0]
 
 
 
 
 
 
 
 
 
 
 
 
167
  diff --git a/gia/eval/rl/gym_evaluator.py b/gia/eval/rl/gym_evaluator.py
168
+ index f8531ee..44f5f91 100644
169
  --- a/gia/eval/rl/gym_evaluator.py
170
  +++ b/gia/eval/rl/gym_evaluator.py
171
  @@ -1,7 +1,7 @@
 
173
  from gym.vector.vector_env import VectorEnv
174
 
175
  -from gia.eval.mappings import TASK_TO_ENV_MAPPING
176
+ +# from gia.eval.mappings import TASK_TO_ENV_MAPPING
177
  from gia.eval.rl.rl_evaluator import RLEvaluator
178
 
179
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a58adfe94e40a3beb02b16571030b03760b1defa8c0c4ef9f4e0f20b8c463c3
3
- size 677382
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b2a99c438b25270b07f006a63f81bb3814b5df728b5146a00b985950e933201
3
+ size 745108
sf_log.txt CHANGED
The diff for this file is too large to render. See raw diff