qgallouedec HF Staff committed on
Commit
0bfb44f
·
1 Parent(s): 2471ab4

Upload folder using huggingface_hub

Browse files
.summary/0/events.out.tfevents.1689589249.qgallouedec-MS-7C84 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28639587c888ad0050e38fe53aa110d6c1ba6d8b8cdb5144f271ab6b81b5d2cf
3
+ size 740627
README.md CHANGED
@@ -15,7 +15,7 @@ model-index:
15
  type: hammer-v2
16
  metrics:
17
  - type: mean_reward
18
- value: 315.73 +/- 31.40
19
  name: mean_reward
20
  verified: false
21
  ---
 
15
  type: hammer-v2
16
  metrics:
17
  - type: mean_reward
18
+ value: 692.49 +/- 21.25
19
  name: mean_reward
20
  verified: false
21
  ---
checkpoint_p0/best_000018088_9261056_reward_697.151.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f81adf9adcdefd0897f5bd6ffc7e410e342ff7ab3ab3f1d38b7220e6b7448bdd
3
+ size 98239
checkpoint_p0/checkpoint_000019472_9969664.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a373ab520bcb67f4f07612dcef05ab7bfea59654c75e7c8a237a6878ebbff8e7
3
+ size 98567
checkpoint_p0/checkpoint_000019544_10006528.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1cc1f7d714b541dbd6795d814171e4325aeefa81624bf798c116302533aa8b5f
3
  size 98567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7444e8b3bc6e428dc8b717589c89933585a70cef5da893f8c8257af22f3691f2
3
  size 98567
config.json CHANGED
@@ -128,7 +128,7 @@
128
  "wandb_user": "qgallouedec",
129
  "wandb_project": "sample_facotry_metaworld"
130
  },
131
- "git_hash": "66db1b7a27030aa65fcfa2d6e3503089a7cff207",
132
  "git_repo_name": "https://github.com/huggingface/gia",
133
- "wandb_unique_id": "hammer-v2_20230708_190205_433334"
134
  }
 
128
  "wandb_user": "qgallouedec",
129
  "wandb_project": "sample_facotry_metaworld"
130
  },
131
+ "git_hash": "998bf2be1819761361d54bcbaf7d9ab9748a770e",
132
  "git_repo_name": "https://github.com/huggingface/gia",
133
+ "wandb_unique_id": "hammer-v2_20230717_122047_003477"
134
  }
git.diff CHANGED
@@ -1,121 +1,122 @@
1
- diff --git a/gia/eval/callback.py b/gia/eval/callback.py
2
- index 5c3a080..4b6198f 100644
3
- --- a/gia/eval/callback.py
4
- +++ b/gia/eval/callback.py
5
- @@ -2,10 +2,10 @@ import glob
6
- import json
7
- import subprocess
8
-
9
- -import wandb
10
- from accelerate import Accelerator
11
- from transformers import TrainerCallback, TrainerControl, TrainerState, TrainingArguments
12
-
13
- +import wandb
14
- from gia.config import Arguments
15
- from gia.eval.utils import is_slurm_available
16
-
17
- diff --git a/gia/eval/evaluator.py b/gia/eval/evaluator.py
18
- index 91b645c..3e2cae7 100644
19
- --- a/gia/eval/evaluator.py
20
- +++ b/gia/eval/evaluator.py
21
- @@ -1,3 +1,5 @@
22
- +from typing import Optional
23
- +
24
- import torch
25
-
26
- from gia.config.arguments import Arguments
27
- @@ -5,11 +7,12 @@ from gia.model import GiaModel
28
-
29
-
30
- class Evaluator:
31
- - def __init__(self, args: Arguments, task: str) -> None:
32
- + def __init__(self, args: Arguments, task: str, mean_random: Optional[float] = None) -> None:
33
- self.args = args
34
- self.task = task
35
- + self.mean_random = mean_random
36
-
37
- - @torch.no_grad()
38
- + @torch.inference_mode()
39
- def evaluate(self, model: GiaModel) -> float:
40
- return self._evaluate(model)
41
-
42
- diff --git a/gia/eval/rl/envs/core.py b/gia/eval/rl/envs/core.py
43
- index ec5e5b2..eeaf7cb 100644
44
- --- a/gia/eval/rl/envs/core.py
45
- +++ b/gia/eval/rl/envs/core.py
46
- @@ -177,7 +177,6 @@ def make(task_name: str, num_envs: int = 1):
47
-
48
- elif task_name.startswith("metaworld"):
49
- import gymnasium as gym
50
- - import metaworld
51
-
52
- env_id = TASK_TO_ENV_MAPPING[task_name]
53
- env = gym.vector.SyncVectorEnv([lambda: gym.make(env_id)] * num_envs)
54
- diff --git a/gia/eval/rl/gia_agent.py b/gia/eval/rl/gia_agent.py
55
- index f0d0b9b..39dc0d2 100644
56
- --- a/gia/eval/rl/gia_agent.py
57
- +++ b/gia/eval/rl/gia_agent.py
58
- @@ -54,7 +54,7 @@ class GiaAgent:
59
- self.action_space = action_space
60
- self.deterministic = deterministic
61
- self.device = next(model.parameters()).device
62
- - self._max_length = self.model.config.max_position_embeddings - 10
63
- + self._max_length = self.model.config.max_position_embeddings - 100 # TODO: fix this
64
-
65
- if isinstance(observation_space, spaces.Box):
66
- self._observation_key = "continuous_observations"
67
- @@ -75,6 +75,11 @@ class GiaAgent:
68
- ) -> Tuple[Tuple[Tensor, Tensor], ...]:
69
- return tuple((k[:, :, -self._max_length :], v[:, :, -self._max_length :]) for (k, v) in past_key_values)
70
-
71
- + def set_model(self, model: GiaModel) -> None:
72
- + self.model = model
73
- + self.device = next(model.parameters()).device
74
- + self._max_length = self.model.config.max_position_embeddings
75
- +
76
- def reset(self, num_envs: int = 1) -> None:
77
- if self.prompter is not None:
78
- prompts = self.prompter.generate_prompts(num_envs)
79
- diff --git a/gia/eval/rl/gym_evaluator.py b/gia/eval/rl/gym_evaluator.py
80
- index f8531ee..754c05d 100644
81
- --- a/gia/eval/rl/gym_evaluator.py
82
- +++ b/gia/eval/rl/gym_evaluator.py
83
- @@ -1,7 +1,7 @@
84
- import gym
85
- from gym.vector.vector_env import VectorEnv
86
-
87
- -from gia.eval.mappings import TASK_TO_ENV_MAPPING
88
- +# from gia.eval.rl.envs.mappings import TASK_TO_ENV_MAPPING
89
- from gia.eval.rl.rl_evaluator import RLEvaluator
90
-
91
-
92
- diff --git a/gia/eval/rl/rl_evaluator.py b/gia/eval/rl/rl_evaluator.py
93
- index c5cc423..91189f3 100644
94
- --- a/gia/eval/rl/rl_evaluator.py
95
- +++ b/gia/eval/rl/rl_evaluator.py
96
- @@ -8,6 +8,10 @@ from gia.eval.rl.gia_agent import GiaAgent
97
-
98
-
99
- class RLEvaluator(Evaluator):
100
- + def __init__(self, args, task):
101
- + super().__init__(args, task)
102
- + self.agent = GiaAgent()
103
- +
104
- def _build_env(self) -> VectorEnv: # TODO: maybe just a gym.Env ?
105
- raise NotImplementedError
106
-
107
- diff --git a/gia/eval/rl/scores_dict.json b/gia/eval/rl/scores_dict.json
108
- index 1b8ebee..ff7d030 100644
109
- --- a/gia/eval/rl/scores_dict.json
110
- +++ b/gia/eval/rl/scores_dict.json
111
- @@ -929,8 +929,8 @@
112
- },
113
- "metaworld-assembly": {
114
- "expert": {
115
- - "mean": 311.29314618777823,
116
- - "std": 75.04282151450695
117
- + "mean": 3523.81468486244,
118
- + "std": 63.22745220327798
119
- },
120
- "random": {
121
- "mean": 220.65601680730813,
 
 
1
+ diff --git a/data/envs/metaworld/generate_dataset_all.sh b/data/envs/metaworld/generate_dataset_all.sh
2
+ index acfe879..0185b2b 100755
3
+ --- a/data/envs/metaworld/generate_dataset_all.sh
4
+ +++ b/data/envs/metaworld/generate_dataset_all.sh
5
+ @@ -2,8 +2,6 @@
6
+
7
+ ENVS=(
8
+ assembly
9
+ - basketball
10
+ - bin-picking
11
+ box-close
12
+ button-press-topdown
13
+ button-press-topdown-wall
14
+ @@ -11,9 +9,7 @@ ENVS=(
15
+ button-press-wall
16
+ coffee-button
17
+ coffee-pull
18
+ - coffee-push
19
+ dial-turn
20
+ - disassemble
21
+ door-close
22
+ door-lock
23
+ door-open
24
+ @@ -22,29 +18,15 @@ ENVS=(
25
+ drawer-open
26
+ faucet-close
27
+ faucet-open
28
+ - hammer
29
+ hand-insert
30
+ handle-press-side
31
+ handle-press
32
+ handle-pull-side
33
+ handle-pull
34
+ lever-pull
35
+ - peg-insert-side
36
+ - peg-unplug-side
37
+ - pick-out-of-hole
38
+ - pick-place
39
+ - pick-place-wall
40
+ - plate-slide-back-side
41
+ - plate-slide-back
42
+ - plate-slide-side
43
+ - plate-slide
44
+ push-back
45
+ push
46
+ push-wall
47
+ - reach
48
+ - reach-wall
49
+ - shelf-place
50
+ - soccer
51
+ stick-pull
52
+ stick-push
53
+ sweep-into
54
+ @@ -54,6 +36,6 @@ ENVS=(
55
+ )
56
+
57
+ for ENV in "${ENVS[@]}"; do
58
+ - python -m sample_factory.huggingface.load_from_hub -r qgallouedec/$ENV-v2
59
+ + # python -m sample_factory.huggingface.load_from_hub -r qgallouedec/$ENV-v2
60
+ python generate_dataset.py --env $ENV-v2 --experiment $ENV-v2 --train_dir=./train_dir
61
+ done
62
+ diff --git a/data/envs/metaworld/train_all.sh b/data/envs/metaworld/train_all.sh
63
+ index dbf328a..7b2fb85 100755
64
+ --- a/data/envs/metaworld/train_all.sh
65
+ +++ b/data/envs/metaworld/train_all.sh
66
+ @@ -1,56 +1,15 @@
67
+ #!/bin/bash
68
+
69
+ ENVS=(
70
+ - assembly
71
+ - basketball
72
+ bin-picking
73
+ - box-close
74
+ - button-press-topdown
75
+ - button-press-topdown-wall
76
+ - button-press
77
+ - button-press-wall
78
+ - coffee-button
79
+ - coffee-pull
80
+ - coffee-push
81
+ - dial-turn
82
+ disassemble
83
+ - door-close
84
+ - door-lock
85
+ - door-open
86
+ - door-unlock
87
+ - drawer-close
88
+ - drawer-open
89
+ - faucet-close
90
+ - faucet-open
91
+ hammer
92
+ - hand-insert
93
+ - handle-press-side
94
+ - handle-press
95
+ - handle-pull-side
96
+ - handle-pull
97
+ - lever-pull
98
+ peg-insert-side
99
+ - peg-unplug-side
100
+ pick-out-of-hole
101
+ pick-place
102
+ pick-place-wall
103
+ - plate-slide-back-side
104
+ - plate-slide-back
105
+ - plate-slide-side
106
+ - plate-slide
107
+ - push-back
108
+ - push
109
+ - push-wall
110
+ - reach
111
+ - reach-wall
112
+ shelf-place
113
+ soccer
114
+ - stick-pull
115
+ - stick-push
116
+ - sweep-into
117
+ - sweep
118
+ - window-close
119
+ - window-open
120
+ )
121
+
122
+ for ENV in "${ENVS[@]}"; do
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
sf_log.txt CHANGED
The diff for this file is too large to render. See raw diff