Upload folder using huggingface_hub

Files changed (7) hide show

added_tokens.json CHANGED Viewed

@@ -1,12 +1,13 @@
 {
-  "[IMG0]": 32000,
-  "[IMG1]": 32001,
-  "[IMG2]": 32002,
-  "[IMG3]": 32003,
-  "[IMG4]": 32004,
-  "[IMG5]": 32005,
-  "[IMG6]": 32006,
-  "[IMG7]": 32007,
-  "[IMG8]": 32008,
-  "[IMG9]": 32009
 }

 {
+  "[IMG0]": 32001,
+  "[IMG1]": 32002,
+  "[IMG2]": 32003,
+  "[IMG3]": 32004,
+  "[IMG4]": 32005,
+  "[IMG5]": 32006,
+  "[IMG6]": 32007,
+  "[IMG7]": 32008,
+  "[IMG8]": 32009,
+  "[IMG9]": 32010,
+  "[SCORE]": 32000
 }

config.json CHANGED Viewed

@@ -5,7 +5,7 @@
   ],
   "attention_bias": false,
   "bos_token_id": 1,
-  "ce_weight": 0.0,
   "emd_weight": 0.0,
   "eos_token_id": 2,
   "freeze_vision_model": false,
@@ -17,7 +17,6 @@
   "initializer_range": 0.02,
   "intermediate_size": 11008,
   "l1_weight": 0.0,
-  "level": false,
   "max_position_embeddings": 2048,
   "max_score": 10,
   "min_score": 1,
@@ -39,14 +38,14 @@
   "num_hidden_layers": 32,
   "num_key_value_heads": 32,
   "num_tokens": 10,
-  "output_first_id": 32000,
-  "output_last_id": 32009,
   "pretraining_tp": 1,
   "rms_norm_eps": 1e-06,
   "rope_scaling": null,
   "rope_theta": 10000.0,
   "tie_word_embeddings": false,
-  "token_weight": 15.0,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.31.0",
   "tune_visual_abstractor": true,
@@ -206,5 +205,5 @@
       "use_flash_attn": false
     }
   },
-  "vocab_size": 32010
 }

   ],
   "attention_bias": false,
   "bos_token_id": 1,
+  "ce_weight": 1.0,
   "emd_weight": 0.0,
   "eos_token_id": 2,
   "freeze_vision_model": false,
   "initializer_range": 0.02,
   "intermediate_size": 11008,
   "l1_weight": 0.0,
   "max_position_embeddings": 2048,
   "max_score": 10,
   "min_score": 1,
   "num_hidden_layers": 32,
   "num_key_value_heads": 32,
   "num_tokens": 10,
+  "output_first_id": 32001,
+  "output_last_id": 32010,
   "pretraining_tp": 1,
   "rms_norm_eps": 1e-06,
   "rope_scaling": null,
   "rope_theta": 10000.0,
+  "score_id": 32000,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.31.0",
   "tune_visual_abstractor": true,
       "use_flash_attn": false
     }
   },
+  "vocab_size": 32011
 }

pytorch_model-00001-of-00002.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fa6dd3cf731fcf0059db05e32868dca32109b7b91f4216cf6dc0515d35c87838
-size 9991673905

 version https://git-lfs.github.com/spec/v1
+oid sha256:b6f425277b735736e9f034b5b9389332441e22fcedb22b3e73abc89c0b4a860b
+size 9991682097

pytorch_model-00002-of-00002.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:905727fa8a677db5ceab6391c4df593a00f980e1af8f2dddf3110e2c239f4267
-size 6417912890

 version https://git-lfs.github.com/spec/v1
+oid sha256:d43cd91bbc03fb08c19be9636228454b63b0351e58d8ff7c55d3f1c3556ae462
+size 6417921082

pytorch_model.bin.index.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "metadata": {
-    "total_size": 16409268226
   },
   "weight_map": {
     "learned_weight": "pytorch_model-00001-of-00002.bin",

 {
   "metadata": {
+    "total_size": 16409284610
   },
   "weight_map": {
     "learned_weight": "pytorch_model-00001-of-00002.bin",

trainer_state.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ad17c8b05629df0466455149bfa645a787bb67afcb762311a0362f30e92c7b5d
-size 6011

 version https://git-lfs.github.com/spec/v1
+oid sha256:9bb7fc4c325c5f0d1d3f37f7b4903cc48160d7dfc97e6eabcc25d3d491750527
+size 5947