---
# Template config for a short "debug" run with model_type "hawk".
# Before use, change dump_dir (commented out below), data.root_dir and the
# tokenizer path (data.tokenizer.path in this layout).
#
# NOTE(review): the nesting below was reconstructed from a copy of this file
# whose line breaks were lost. Confirm the placement of detect_anomaly,
# model_type and tokenizer against the schema of the code that loads it.

# Uncomment and replace the whole placeholder with a real output directory.
# dump_dir: !!CHANGETHIS!!
name: "debug"
steps: 1000
# probe_freq: 100
seed: 777

optim:
  # Explicit mantissa dot: YAML 1.1 loaders (e.g. PyYAML) resolve a bare
  # `3e-4` as a string rather than a float.
  lr: 3.0e-4
  # NOTE(review): warmup (2000) is larger than steps (1000); presumably both
  # count optimizer steps, in which case warmup never finishes — confirm.
  warmup: 2000
  lr_min_ratio: 0.000001
  clip: 1.0

distributed:
  fsdp_type: full_shard
  compile: true
  model_dtype: bf16
  matmul_allow_tf32: false
  selective_activation_checkpointing: false
  tp_size: 1
  detect_anomaly: true

model_type: "hawk"

model:
  dim: 1024
  n_layers: 8
  n_heads: 8
  conv_size: 4

data:
  # Change to the directory that holds the sources listed below.
  root_dir: data/shuffled
  # Source name -> value; presumably a sampling weight — TODO confirm.
  sources:
    dclm_baseline_1.0: 1.0
  batch_size: 32
  prefetch_size: 64
  seq_len: 2048
  n_views: 2
  load_async: true
  tokenizer:
    name: sp
    # Change to the location of your tokenizer model file.
    path: tokenizers/tokenizer_final_32k.minus_inf_ws.model

profiling:
  run: true

checkpoint:
  dump:
    every: 100
    keep: 1
  eval:
    every: 100
    keep: 1

logging:
  freq: 10

eval:
  generator:
    max_tokens: 8192
    dtype: bf16
    temperature: 1.0
    top_p: 0.95
  harness:
    # Plain entries name a task; nq_open is written as a mapping so it can
    # carry its own num_fewshot setting.
    tasks:
      - hellaswag
      - piqa
      - task: nq_open
        num_fewshot: 5
  validation:
    max_steps: 100