---
# Trainer section: resource sizing for the run.
# NOTE(review): presumably node count and GPUs per node - confirm with the consumer.
trainer:
  nnodes: 1
  n_gpus_per_node: 1
# Data section: input file, prompt field, sampling count, output file, batch size.
# Kept as children of `data` so that `path` here does not collide with any
# other section's `path` key.
data:
  path: ./data/parquet/test.parquet
  # NOTE(review): presumably the column in the input file that holds the prompt - confirm.
  prompt_key: prompt
  n_samples: 1
  output_path: ./checkpoints/grammar_generation.parquet
  batch_size: 1
# Model section: which model to load and optional extra parameter loading.
model:
  # NOTE(review): looks like a hub-style model identifier rather than a local path - confirm.
  path: deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
  external_lib: null
  # Booleans are written in canonical lowercase so every YAML parser agrees.
  load_param: false
  # NOTE(review): presumably only read when load_param is true - confirm.
  load_param_path: null
# Rollout section: generation backend and sampling/engine settings.
rollout:
  name: vllm
  mode: sync
  # NOTE(review): temperature 0.0 together with do_sample: true below looks
  # like greedy decoding requested through a sampling path - confirm intent.
  temperature: 0.0
  top_k: -1
  top_p: 1.0
  max_loras: 1
  prompt_length: 1800
  response_length: 512

  dtype: bfloat16
  gpu_memory_utilization: 0.9
  ignore_eos: false
  enforce_eager: true
  free_cache_engine: true
  load_format: dummy_dtensor
  tensor_model_parallel_size: 1
  max_num_batched_tokens: 8192
  # NOTE(review): max_model_len (1800) equals prompt_length and is smaller than
  # prompt_length + response_length (1800 + 512 = 2312). If the engine caps
  # prompt plus response at max_model_len, long prompts leave little or no
  # room for the response - TODO confirm, and raise to 2312 or set null if so.
  max_model_len: 1800
  max_num_seqs: 1024
  log_prob_micro_batch_size: null
  log_prob_micro_batch_size_per_gpu: 1

  use_fire_sampling: false

  do_sample: true
  disable_log_stats: false
  enable_chunked_prefill: true
  n: 1
# Actor section: parallelism strategy settings.
# NOTE(review): placed at top level as a sibling of the other sections; the
# nesting of `fsdp_size` under `fsdp_config` follows from `fsdp_config` having
# no value of its own - confirm both against the consumer's schema.
actor:
  strategy: fsdp
  ulysses_sequence_parallel_size: 1
  fsdp_config:
    fsdp_size: -1
# Ray initialisation settings.
# NOTE(review): null presumably leaves the CPU count to the runtime's default -
# confirm, and set an explicit number on schedulers that limit CPUs.
ray_init:
  num_cpus: null