impossibleexchange committed on
Commit
3e87275
·
verified ·
1 Parent(s): cac51de

Upload training_config.yml with huggingface_hub

Browse files
Files changed (1) hide show
  1. training_config.yml +80 -0
training_config.yml ADDED
@@ -0,0 +1,80 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ _component_: models.lora_mmllama3_8b
3
+ lora_attn_modules:
4
+ - q_proj
5
+ - v_proj
6
+ apply_lora_to_mlp: false
7
+ apply_lora_to_output: false
8
+ lora_rank: 32
9
+ lora_alpha: 64
10
+ perception_tokens: 2
11
+ use_clip: false
12
+ tokenizer:
13
+ _component_: models.a2a_tokenizer
14
+ path: models/tokenizer.model
15
+ checkpointer:
16
+ _component_: torchtune.utils.FullModelMetaCheckpointer
17
+ checkpoint_dir: output_checkpoints/experiment_1
18
+ checkpoint_files:
19
+ - meta_model_5.pt
20
+ adapter_checkpoint: adapter_latest.pt
21
+ recipe_checkpoint: recipe_state.pt
22
+ output_dir: output_checkpoints/experiment_1
23
+ model_type: LLAMA3
24
+ resume_from_checkpoint: false
25
+ interim_checkpoint_steps: 20000
26
+ interim_gen_steps: null
27
+ max_new_tokens: 77
28
+ temperature: 0.8
29
+ top_k: 231
30
+ dataset:
31
+ _component_: ds.EvenBatcher
32
+ buffer_size: 128
33
+ dataset:
34
+ _component_: ds.RoundRobinDataset
35
+ datasets:
36
+ - _component_: ds.OmegaVideoCaptionDataset
37
+ length: 700000
38
+ seed: null
39
+ shuffle: true
40
+ batch_size: 1
41
+ optimizer:
42
+ _component_: torch.optim.AdamW
43
+ weight_decay: 0.003
44
+ lr: 0.0001
45
+ lr_scheduler:
46
+ _component_: torchtune.modules.get_cosine_schedule_with_warmup
47
+ num_warmup_steps: 1000
48
+ loss:
49
+ _component_: torch.nn.CrossEntropyLoss
50
+ label_smoothing: 0.1
51
+ grad_clip:
52
+ _component_: torch.nn.utils.clip_grad_norm_
53
+ max_norm: 1.0
54
+ norm_type: 2
55
+ epochs: 1
56
+ max_steps_per_epoch: null
57
+ gradient_accumulation_steps: 128
58
+ compile: false
59
+ output_dir: /tmp/lora_finetune_output
60
+ metric_logger:
61
+ _component_: torchtune.utils.metric_logging.DiskLogger
62
+ log_dir: ${output_dir}
63
+ log_every_n_steps: null
64
+ device: cuda
65
+ dtype: bf16
66
+ enable_activation_checkpointing: false
67
+ profiler:
68
+ _component_: torchtune.utils.profiler
69
+ enabled: false
70
+ inference:
71
+ prompt_template: 'Video:
72
+
73
+ {video}
74
+
75
+ Caption the previous video.'
76
+ max_new_tokens: 231
77
+ temperature: 0.8
78
+ top_k: 231
79
+ quantizer: null
80
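+ gradient-accumulation-steps: 32  # NOTE(review): hyphenated spelling; gradient_accumulation_steps: 128 is also set earlier in this file — confirm which key the recipe actually reads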