impossibleexchange committed on
Commit
9ec9c4e
·
verified ·
1 Parent(s): aa510b0

Delete training_config.yml

Browse files
Files changed (1) hide show
  1. training_config.yml +0 -93
training_config.yml DELETED
@@ -1,93 +0,0 @@
1
- model:
2
- _component_: models.lora_mmllama3_8b
3
- lora_attn_modules:
4
- - q_proj
5
- - v_proj
6
- apply_lora_to_mlp: false
7
- apply_lora_to_output: false
8
- lora_rank: 16
9
- lora_alpha: 32
10
- perception_tokens: 2
11
- use_clip: false
12
- tokenizer:
13
- _component_: models.a2a_tokenizer
14
- path: models/tokenizer.model
15
- freeze_layers:
16
- _component_: torchtune.utils.Freeze_Layers
17
- num_layers: 8
18
- checkpointer:
19
- _component_: torchtune.utils.FullModelMetaCheckpointer
20
- checkpoint_dir: output_checkpoints/experiment_1
21
- checkpoint_files:
22
- - meta_model_0.pt
23
- adapter_checkpoint: null
24
- recipe_checkpoint: null
25
- output_dir: output_checkpoints/experiment_1
26
- model_type: LLAMA3
27
- use_freeze_layers: true
28
- resume_from_checkpoint: false
29
- interim_checkpoint_steps: 20000
30
- interim_gen_steps: null
31
- max_new_tokens: 100
32
- temperature: 0.6
33
- top_k: 225
34
- dataset:
35
- _component_: ds.EvenBatcher
36
- buffer_size: 1000
37
- datasets:
38
- - _component_: ds.OmegaVideoCaptionDataset
39
- length: 500000
40
- - _component_: ds.LlavaInstructDataset
41
- dataset_path: ds/coco_llava_instruct/output.parquet
42
- train_on_input: false
43
- - _component_: ds.LlavaInstructDataset
44
- dataset_path: ds/vision_flan/output.parquet
45
- train_on_input: false
46
- - _component_: ds.CaptionInstructDataset
47
- dataset_path: ds/sam_llava/output.parquet
48
- train_on_input: false
49
- seed: null
50
- shuffle: true
51
- batch_size: 2
52
- optimizer:
53
- _component_: torch.optim.AdamW
54
- weight_decay: 0.0001
55
- lr: 0.0001
56
- betas:
57
- - 0.9
58
- - 0.998
59
- lr_scheduler:
60
- _component_: torchtune.modules.get_cosine_schedule_with_warmup
61
- num_warmup_steps: 500
62
- loss:
63
- _component_: torch.nn.CrossEntropyLoss
64
- grad_clip:
65
- _component_: torch.nn.utils.clip_grad_norm
66
- max_norm: 2.0
67
- norm_type: 2
68
- epochs: 6
69
- max_steps_per_epoch: null
70
- gradient_accumulation_steps: 32
71
- compile: true
72
- output_dir: /tmp/lora_finetune_output
73
- metric_logger:
74
- _component_: torchtune.utils.metric_logging.DiskLogger
75
- log_dir: ${output_dir}
76
- log_every_n_steps: null
77
- device: cuda
78
- dtype: bf16
79
- enable_activation_checkpointing: false
80
- profiler:
81
- _component_: torchtune.utils.profiler
82
- enabled: true
83
- inference:
84
- prompt_template: 'Video:
85
-
86
- {video}
87
-
88
- Caption the previous video.'
89
- max_new_tokens: 300
90
- temperature: 0.6
91
- top_k: 300
92
- quantizer: null
93
- gradient-accumulation-steps: 32