Upload CQL_model.yaml
Browse files- CQL_model.yaml +30 -0
CQL_model.yaml
ADDED
|
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# -- Model Description --
|
| 2 |
+
# Top-level keys naming the algorithm, environment, dataset version and trainer version.
|
| 3 |
+
algorithm: quantile
|
| 4 |
+
env: ac-pulse
|
| 5 |
+
dataset_version: v12
|
| 6 |
+
trainer_version: CQL
|
| 7 |
+
|
| 8 |
+
# Training run settings.
train:
|
| 9 |
+
dataset_name: 500k_dataset
|
| 10 |
+
# Empty string: no initial checkpoint directory is given.
init_checkpoint_dir: ""
|
| 11 |
+
# Gin config file(s) for the run; the single entry is the quantile config.
gin_files: ["src/batch_rl/fixed_replay/configs/quantile.gin"]
|
| 12 |
+
# List of "Class.param=value" strings. Presumably applied as Gin overrides on
# top of gin_files - TODO confirm against the trainer.
gin_bindings:
|
| 13 |
+
[
|
| 14 |
+
"FixedReplayRunner.num_iterations=1000",
|
| 15 |
+
"FixedReplayQuantileAgent.minq_weight=4.0",
|
| 16 |
+
"FixedReplayRunner.training_steps=250000",
|
| 17 |
+
]
|
| 18 |
+
# Checkpoint-loading flags, written as canonical lowercase YAML booleans so
# they parse the same way under YAML 1.1 and 1.2 loaders.
load_last_checkpoint: false
|
| 19 |
+
load_experiment_checkpoint: false
|
| 20 |
+
# Explicit null: no train_id is set.
train_id: null
|
| 21 |
+
# Environment settings.
env_config:
|
| 22 |
+
# Presumably the length of the observation vector - TODO confirm with the env.
obs_shape: 63
|
| 23 |
+
|
| 24 |
+
# NOTE(review): evaluation uses dataset version v11 while dataset_version is
# v12 - confirm the mismatch is intentional.
evaluation_dataset_version: v11
|
| 25 |
+
evaluation_dataset_name: 10k_uniform_dataset_users
|
| 26 |
+
|
| 27 |
+
# Evaluation settings.
evaluation:
|
| 28 |
+
# Canonical lowercase boolean (same parsed value as the previous `True`).
only_during_train: true
|
| 29 |
+
|
| 30 |
+
# Explicit empty mapping: no extra config entries are set.
config: {}
|