debug_gpt2 / train_configs.json
nbtpj's picture
Upload best model checkpoint
174b104 verified
{
  "dataset_name": "nbtpj/summ_ds_train",
  "dataset_config_name": null,
  "train_split_name": "merge36_cnndmsamsumxsum",
  "text_template": "{text}\nTL;DR: {summary}",
  "label_col": "summary",
  "freeze_role2": false,
  "only_train_role1": false,
  "model_name_or_path": "gpt2",
  "ref_role1_name_or_path": "gpt2",
  "ref_role2_name_or_path": "gpt2",
  "pretrained_role2_name_or_path": "none",
  "config_name": null,
  "vectorizer_path": "/common/home/users/m/mq.nguyen.2023/testcode/SAC_LM/module9_clmv2/vectorizer/wikitext103_tfidf_full.joblib",
  "tokenizer_name": null,
  "use_slow_tokenizer": false,
  "per_device_train_batch_size": 4,
  "per_device_query_rollout_batch_size": 32,
  "per_device_eval_batch_size": 4,
  "vllm_vram_ratio": 0.3,
  "learning_rate": 3e-07,
  "grad_norm": 0.5,
  "weight_decay": 1e-05,
  "max_train_steps": 40000,
  "max_train_rollouts": 100000,
  "gradient_accumulation_steps": 1,
  "lr_scheduler_type": "constant",
  "num_warmup_steps": 200,
  "seed": 0,
  "model_type": null,
  "block_size": 1024,
  "mini_epoch": 1,
  "rollout_game": "baseline3v2",
  "rl_algo": "on_policy",
  "constraint_type": "kl",
  "clamp_update": false,
  "rl_w": 1.0,
  "lm_w": 1.0,
  "n_generate": 4,
  "n_augment": 0,
  "gradient_checkpoint": false,
  "group_relative_norm": true,
  "sample_config": {
    "do_sample": true,
    "min_new_tokens": 20,
    "temperature": 1.0
  },
  "inference_config": {
    "do_sample": false,
    "temperature": 0.0,
    "min_new_tokens": 5,
    "max_new_tokens": 250
  },
  "rollout_config": {
    "accuracy_w": 12.960656597279739,
    "len_pen": 1.0,
    "accuracy_w2": 30.20289640158668,
    "len_pen2": 1.0,
    "threshold": 0.09062263471261954,
    "similarity_fn": "rouge"
  },
  "ent_coef": 0.0001,
  "beta_coef": "0.0",
  "prompt_0": "{text}",
  "prompt_1": "{text}\nTL;DR: ",
  "prompt_2": "Given the text: {role1_output}\nReconstruct the summarized text to the detailed:",
  "prompt_eval": "{text}\nTL;DR:",
  "epsilon": 0.2,
  "a2g_norm": true,
  "vllm_sleep": true,
  "lora": false,
  "need_attn_mask": true,
  "gamma": 0.95,
  "trust_remote_code": true,
  "test_glue": false,
  "test_clm": false,
  "causal_model": true,
  "test_gen": true,
  "log_rollout_txt": true,
  "trunc_eval": 256,
  "trunc_evals": [
    "cnndm___12",
    "samsum___12",
    "xsum___12",
    "gigaword___200",
    "duc___50"
  ],
  "use_deepspeed": false,
  "zero_config": 2,
  "log_interval": "5m",
  "eval_interval": "100",
  "checkpoint_interval": "100",
  "lm_fraction": -1.0,
  "push_to_hub": null,
  "keep_eval_size": false,
  "mixed_precision": "bf16",
  "tune_metrics": [
    "cnndm/rouge1___1.0",
    "cnndm/bertscore_f1___0.25",
    "samsum/rouge1___1.0",
    "samsum/bertscore_f1___0.25",
    "xsum/rouge1___1.0",
    "xsum/bertscore_f1___0.25"
  ],
  "base_path": "/common/home/users/m/mq.nguyen.2023/testcode/SAC_LM/module9_clmv2",
  "script": "/common/home/users/m/mq.nguyen.2023/testcode/SAC_LM/module9_clmv2/execute/utune/debug.py",
  "train_from_raw": true,
  "world_size": 1,
  "cpu_per_worker": 7,
  "gpu_per_worker": 1
}