ztyang196 committed on
Commit
6bb28b7
·
verified ·
1 Parent(s): fbe0c3e

Delete captioner

Browse files
captioner/.DS_Store DELETED
Binary file (6.15 kB)
 
captioner/README.md DELETED
Binary file (264 Bytes)
 
captioner/adapter_config.json DELETED
@@ -1,26 +0,0 @@
1
- {
2
- "auto_mapping": null,
3
- "base_model_name_or_path": "llava-v1.5-13b",
4
- "bias": "none",
5
- "fan_in_fan_out": false,
6
- "inference_mode": true,
7
- "init_lora_weights": true,
8
- "layers_pattern": null,
9
- "layers_to_transform": null,
10
- "lora_alpha": 256,
11
- "lora_dropout": 0.05,
12
- "modules_to_save": null,
13
- "peft_type": "LORA",
14
- "r": 128,
15
- "revision": null,
16
- "target_modules": [
17
- "gate_proj",
18
- "up_proj",
19
- "q_proj",
20
- "v_proj",
21
- "o_proj",
22
- "k_proj",
23
- "down_proj"
24
- ],
25
- "task_type": "CAUSAL_LM"
26
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
captioner/adapter_model.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a75d4904466df96ba770230d096e0e976e3c0cd67b62c93e383cac35def1dbad
3
- size 2002974413
 
 
 
 
captioner/config.json DELETED
@@ -1,45 +0,0 @@
1
- {
2
- "_name_or_path": "captioner",
3
- "architectures": [
4
- "LlavaLlamaForCausalLM"
5
- ],
6
- "bos_token_id": 1,
7
- "eos_token_id": 2,
8
- "freeze_mm_mlp_adapter": false,
9
- "freeze_mm_vision_resampler": false,
10
- "hidden_act": "silu",
11
- "hidden_size": 5120,
12
- "image_aspect_ratio": "pad",
13
- "initializer_range": 0.02,
14
- "intermediate_size": 13824,
15
- "max_length": 4096,
16
- "max_position_embeddings": 4096,
17
- "mm_hidden_size": 1024,
18
- "mm_projector_lr": 2e-05,
19
- "mm_projector_type": "mlp2x_gelu",
20
- "mm_resampler_type": null,
21
- "mm_use_im_patch_token": false,
22
- "mm_use_im_start_end": false,
23
- "mm_vision_select_feature": "patch",
24
- "mm_vision_select_layer": -2,
25
- "mm_vision_tower": "/mnt/workspace/workgroup/temporary/zhantao/BACON/ckpt/clip-vit-large-patch14-336",
26
- "model_type": "llava_llama",
27
- "num_attention_heads": 40,
28
- "num_hidden_layers": 40,
29
- "num_key_value_heads": 40,
30
- "pad_token_id": 0,
31
- "pretraining_tp": 1,
32
- "rms_norm_eps": 1e-05,
33
- "rope_scaling": null,
34
- "tie_word_embeddings": false,
35
- "tokenizer_model_max_length": 4096,
36
- "tokenizer_padding_side": "right",
37
- "torch_dtype": "float16",
38
- "transformers_version": "4.31.0",
39
- "tune_mm_mlp_adapter": false,
40
- "tune_mm_vision_resampler": false,
41
- "unfreeze_mm_vision_tower": false,
42
- "use_cache": true,
43
- "use_mm_proj": true,
44
- "vocab_size": 32000
45
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
captioner/non_lora_trainables.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:de935c4cc6ef5ed1f0a883fd80874aac46e17d5bcc4f28f68de5cc2f30717898
3
- size 62936807
 
 
 
 
captioner/trainer_state.json DELETED
The diff for this file is too large to render. See raw diff