# Source: Hugging Face repository furau/PlatoLM-DPO, file config.yaml
# Commit ae6c1c3 ("Upload 4 files"), file size 1.12 kB.

	seed: 0
	exp_name: dpo_mistral_fsdp_bf16_hh_harmless
	batch_size: 8
	eval_batch_size: 16
	debug: false
	fsdp_port: 30287
	datasets:
	- hh
	wandb:
	enabled: true
	entity: renatz1224
	project: dpo
	api_key: d41bb0d59da8688d3d8f5371b1e3b3cfcced0f74
	local_dirs:
	- /mntcephfs/data/med/chuyi2/dpo
	sample_during_eval: false
	n_eval_model_samples: 16
	do_first_eval: true
	local_run_dir: /mntcephfs/data/med/chuyi2/dpo/kongchuyi/dpo_mistral_fsdp_bf16_hh_harmless_2024-02-21_19-35-15_643724
	lr: 5.0e-07
	gradient_accumulation_steps: 1
	max_grad_norm: 10.0
	max_length: 4096
	max_prompt_length: 2048
	n_epochs: 1
	n_examples: null
	n_eval_examples: 256
	trainer: FSDPTrainer
	optimizer: RMSprop
	warmup_steps: 50
	activation_checkpointing: true
	eval_every: 2000
	minimum_log_interval_secs: 1.0
	model:
	name_or_path: /mntnfs/med_data2/kcy/la2-mistral-30k/checkpoint-445
	tokenizer_name_or_path: /mntnfs/med_data2/kcy/la2-mistral-30k/checkpoint-445
	archive: null
	block_name: MistralDecoderLayer
	policy_dtype: bfloat16
	fsdp_policy_mp: bfloat16
	reference_dtype: float16
	loss:
	name: dpo
	beta: 0.1
	label_smoothing: 0
	reference_free: false