3v324v23 committed on
Commit
a560c36
·
0 Parent(s):

Brown-Tan: 25-11-2024

Browse files
Files changed (5) hide show
  1. .gitattributes +35 -0
  2. README.md +3 -0
  3. hotkey.txt +1 -0
  4. meta_model_0.pt +3 -0
  5. training_config.yml +83 -0
.gitattributes ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ Time is the scarcest resource and unless it is managed nothing else can be managed.
2
+ =============
3
+ table-mango-bicycle-umbrella-piano
hotkey.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ 5F9yGQDSazjhhs9cHXV9NXEbzVthkKqdwwv92wDyucHF1yTs
meta_model_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69e34ee425dea4236208b1294c3b2b59fbdffdb5a6ae69f376c6580ca1927dc3
3
+ size 16219158403
training_config.yml ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ _component_: models.lora_mmllama3_8b
3
+ lora_attn_modules:
4
+ - q_proj
5
+ - v_proj
6
+ apply_lora_to_mlp: false
7
+ apply_lora_to_output: false
8
+ lora_rank: 16
9
+ lora_alpha: 32
10
+ perception_tokens: 2
11
+ use_clip: false
12
+ tokenizer:
13
+ _component_: models.a2a_tokenizer
14
+ path: models/tokenizer.model
15
+ checkpointer:
16
+ _component_: torchtune.utils.FullModelMetaCheckpointer
17
+ checkpoint_dir: /workspace/omega_a2a/training
18
+ checkpoint_files:
19
+ - consolidated.00.pth
20
+ adapter_checkpoint: null
21
+ recipe_checkpoint: null
22
+ output_dir: /workspace/omega_a2a/checkpoints
23
+ model_type: LLAMA3
24
+ resume_from_checkpoint: false
25
+ interim_checkpoint_steps: 5000
26
+ interim_gen_steps: null
27
+ max_new_tokens: 170
28
+ temperature: 0.8
29
+ top_k: 200
30
+ dataset:
31
+ _component_: ds.EvenBatcher
32
+ buffer_size: 36
33
+ dataset:
34
+ _component_: ds.RoundRobinDataset
35
+ datasets:
36
+ - _component_: ds.OmegaVideoCaptionDataset
37
+ length: 500000
38
+ - _component_: ds.LlavaInstructDataset
39
+ dataset_path: ds/coco_llava_instruct/output.parquet
40
+ train_on_input: false
41
+ - _component_: ds.LlavaInstructDataset
42
+ dataset_path: ds/vision_flan/output.parquet
43
+ train_on_input: false
44
+ - _component_: ds.CaptionInstructDataset
45
+ dataset_path: ds/sam_llava/output.parquet
46
+ train_on_input: false
47
+ seed: null
48
+ shuffle: true
49
+ batch_size: 4
50
+ optimizer:
51
+ _component_: torch.optim.AdamW
52
+ weight_decay: 0.0001
53
+ lr: 3.0e-05
54
+ lr_scheduler:
55
+ _component_: torchtune.modules.get_cosine_schedule_with_warmup
56
+ num_warmup_steps: 100
57
+ loss:
58
+ _component_: torch.nn.CrossEntropyLoss
59
+ epochs: 6
60
+ max_steps_per_epoch: null
61
+ gradient_accumulation_steps: 64
62
+ compile: false
63
+ output_dir: /tmp/lora_finetune_output
64
+ metric_logger:
65
+ _component_: torchtune.utils.metric_logging.DiskLogger
66
+ log_dir: ${output_dir}
67
+ log_every_n_steps: null
68
+ device: cuda
69
+ dtype: bf16
70
+ enable_activation_checkpointing: false
71
+ profiler:
72
+ _component_: torchtune.utils.profiler
73
+ enabled: false
74
+ inference:
75
+ prompt_template: 'Video:
76
+
77
+ {video}
78
+
79
+ Caption the previous video.'
80
+ max_new_tokens: 170
81
+ temperature: 0.6
82
+ top_k: 200
83
+ quantizer: null