nbtpj committed on
Commit
5bcec5b
·
verified ·
1 Parent(s): 174b104

Upload ray_tune_logs/params.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. ray_tune_logs/params.json +113 -0
ray_tune_logs/params.json ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "train_loop_config": {
3
+ "a2g_norm": true,
4
+ "base_path": "/common/home/users/m/mq.nguyen.2023/testcode/SAC_LM/module9_clmv2",
5
+ "beta_coef": "0.0",
6
+ "block_size": 1024,
7
+ "causal_model": true,
8
+ "checkpoint_interval": "100",
9
+ "clamp_update": false,
10
+ "config_name": null,
11
+ "constraint_type": "kl",
12
+ "cpu_per_worker": 7,
13
+ "dataset_config_name": null,
14
+ "dataset_name": "nbtpj/summ_ds_train",
15
+ "ent_coef": 0.0001,
16
+ "epsilon": 0.2,
17
+ "eval_interval": "100",
18
+ "freeze_role2": false,
19
+ "gamma": 0.95,
20
+ "gpu_per_worker": 1,
21
+ "grad_norm": 0.5,
22
+ "gradient_accumulation_steps": 1,
23
+ "gradient_checkpoint": false,
24
+ "group_relative_norm": true,
25
+ "inference_config": {
26
+ "do_sample": true,
27
+ "max_new_tokens": 250,
28
+ "min_new_tokens": 5,
29
+ "temperature": 0.0
30
+ },
31
+ "keep_eval_size": false,
32
+ "label_col": "summary",
33
+ "learning_rate": 3e-07,
34
+ "lm_fraction": -1.0,
35
+ "lm_w": 1.0,
36
+ "log_interval": "5m",
37
+ "log_rollout_txt": true,
38
+ "lora": true,
39
+ "lr_scheduler_type": "constant",
40
+ "max_train_rollouts": 100000,
41
+ "max_train_steps": 40000,
42
+ "mini_epoch": 1,
43
+ "mixed_precision": "bf16",
44
+ "model_name_or_path": "gpt2",
45
+ "model_type": null,
46
+ "n_augment": 0,
47
+ "n_generate": 4,
48
+ "need_attn_mask": true,
49
+ "num_warmup_steps": 200,
50
+ "only_train_role1": false,
51
+ "per_device_eval_batch_size": 4,
52
+ "per_device_query_rollout_batch_size": 32,
53
+ "per_device_train_batch_size": 4,
54
+ "pretrained_role2_name_or_path": "none",
55
+ "prompt_0": "{text}",
56
+ "prompt_1": "{text}\nTL;DR: ",
57
+ "prompt_2": "Given the text: {role1_output}\nReconstruct the summarized text to the detailed:",
58
+ "prompt_eval": "{text}\nTL;DR:",
59
+ "push_to_hub": null,
60
+ "ref_role1_name_or_path": "gpt2",
61
+ "ref_role2_name_or_path": "gpt2",
62
+ "rl_algo": "on_policy",
63
+ "rl_w": 1.0,
64
+ "rollout_config": {
65
+ "accuracy_w": 1.5676677195506077,
66
+ "accuracy_w2": 7.257005721594282,
67
+ "len_pen": 1.0,
68
+ "len_pen2": 1.0,
69
+ "similarity_fn": "rouge",
70
+ "threshold": 0.01605191133358762
71
+ },
72
+ "rollout_game": "baseline3v2",
73
+ "sample_config": {
74
+ "do_sample": true,
75
+ "min_new_tokens": 20,
76
+ "temperature": 1.0
77
+ },
78
+ "script": "/common/home/users/m/mq.nguyen.2023/testcode/SAC_LM/module9_clmv2/execute/utune/debug.py",
79
+ "seed": 0,
80
+ "test_clm": false,
81
+ "test_gen": true,
82
+ "test_glue": false,
83
+ "text_template": "{text}\nTL;DR: {summary}",
84
+ "tokenizer_name": null,
85
+ "train_from_raw": true,
86
+ "train_split_name": "merge36_cnndmsamsumxsum",
87
+ "trunc_eval": 256,
88
+ "trunc_evals": [
89
+ "cnndm___12",
90
+ "samsum___12",
91
+ "xsum___12",
92
+ "gigaword___200",
93
+ "duc___50"
94
+ ],
95
+ "trust_remote_code": true,
96
+ "tune_metrics": [
97
+ "cnndm/rouge1___1.0",
98
+ "cnndm/bertscore_f1___0.25",
99
+ "samsum/rouge1___1.0",
100
+ "samsum/bertscore_f1___0.25",
101
+ "xsum/rouge1___1.0",
102
+ "xsum/bertscore_f1___0.25"
103
+ ],
104
+ "use_deepspeed": false,
105
+ "use_slow_tokenizer": false,
106
+ "vectorizer_path": "/common/home/users/m/mq.nguyen.2023/testcode/SAC_LM/module9_clmv2/vectorizer/wikitext103_tfidf_full.joblib",
107
+ "vllm_sleep": true,
108
+ "vllm_vram_ratio": 0.3,
109
+ "weight_decay": 1e-05,
110
+ "world_size": 1,
111
+ "zero_config": 2
112
+ }
113
+ }