hug-me-please committed on
Commit
b1ab320
·
verified ·
1 Parent(s): fd090b3

Upload 2 files

Browse files
Files changed (2) hide show
  1. config.json +51 -0
  2. pytorch_model.bin +3 -0
config.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "accelerator_kwargs": {},
3
+ "adap_kl_ctrl": true,
4
+ "backward_batch_size": 1,
5
+ "batch_size": 64,
6
+ "cliprange": 0.2,
7
+ "cliprange_value": 0.2,
8
+ "compare_steps": 1,
9
+ "dataset_num_proc": null,
10
+ "early_stopping": true,
11
+ "exp_name": "rl_training",
12
+ "forward_batch_size": null,
13
+ "gamma": 1,
14
+ "global_backward_batch_size": 1,
15
+ "global_batch_size": 64,
16
+ "gradient_accumulation_steps": 1,
17
+ "gradient_checkpointing": false,
18
+ "horizon": 10000,
19
+ "init_kl_coef": 0.2,
20
+ "is_encoder_decoder": false,
21
+ "is_peft_model": true,
22
+ "kl_penalty": "kl",
23
+ "lam": 0.95,
24
+ "learning_rate": 1.4e-05,
25
+ "log_with": "mlflow",
26
+ "max_grad_norm": null,
27
+ "mini_batch_size": 1,
28
+ "model_name": "DLI-Lab/camel",
29
+ "optimize_cuda_cache": true,
30
+ "optimize_device_cache": false,
31
+ "ppo_epochs": 4,
32
+ "project_kwargs": {},
33
+ "push_to_hub_if_best_kwargs": {},
34
+ "query_dataset": "imdb",
35
+ "ratio_threshold": 10.0,
36
+ "remove_unused_columns": true,
37
+ "reward_model": "sentiment-analysis:lvwerra/distilbert-imdb",
38
+ "score_clip": null,
39
+ "seed": 0,
40
+ "steps": 10000,
41
+ "target": 6,
42
+ "target_kl": 0.1,
43
+ "task_name": null,
44
+ "tracker_kwargs": {},
45
+ "tracker_project_name": "trl",
46
+ "use_score_norm": false,
47
+ "use_score_scaling": false,
48
+ "vf_coef": 0.1,
49
+ "whiten_rewards": false,
50
+ "world_size": 1
51
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fae489432c27a7e85f40bdca42acd2f30e01ad9a447a4fae340354db5fdd3285
3
+ size 17916