Update model weights after training (epoch 1, loss 4.0192)

Files changed (7) hide show

audio_decoder.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:37e38d5f45ab1bb841c51d43d1a830339c9554d7b7121b40c29543be6b8bb246
 size 1458415836

 version https://git-lfs.github.com/spec/v1
+oid sha256:9cc0af3086d6987e71c00b7121394b8ac820d2276ff994014479d4fc2cf094bf
 size 1458415836

cross_attention.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f7967eb8d40a1c69ade87aaae8872447a9f3b28418fadde6d1a8f876d96a6848
 size 174191400

 version https://git-lfs.github.com/spec/v1
+oid sha256:9034e718a6461ed04d5723c8ecf429d0daedb7fc49274a1fbd17b80bb9dd77b9
 size 174191400

generator.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:89ea74af2d5ac45430e7dc96fd17ddf368b8baa87a4133046782ec32e7a63224
 size 629440508

 version https://git-lfs.github.com/spec/v1
+oid sha256:02673bab0a9e2949c2f3bfe0725ff77cd631fd89a559d86e9c886c99455a5e72
 size 629440508

llm.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:96e14153b590b91954c672ba79a681cd40c08dfc82dcb9e5500e87c2d8d23c83
 size 1506831304

 version https://git-lfs.github.com/spec/v1
+oid sha256:b4ce3c75e0ec09d93c0580ed862f12191e3ea3bd53ab8906e0108cafd5d6fc18
 size 1506831304

streaming_state.json CHANGED Viewed

@@ -1,26 +1,26 @@
 {
-  "epoch": 4,
-  "unique_samples": 800,
-  "total_yields": 1600,
   "dataset_positions": {
-    "WebSight": 136,
-    "ScienceQA": 114,
-    "InstructPix2Pix": 136,
-    "Flickr8k": 136,
-    "NewYorker": 136,
     "Football": 6,
-    "MagicBrush": 136
   },
   "modality_positions": {
     "text": {},
     "image": {
-      "WebSight": 136,
-      "ScienceQA": 114,
-      "InstructPix2Pix": 136,
-      "Flickr8k": 136,
-      "NewYorker": 136,
       "Football": 6,
-      "MagicBrush": 136
     },
     "video": {},
     "audio": {}

 {
+  "epoch": 5,
+  "unique_samples": 1100,
+  "total_yields": 2200,
   "dataset_positions": {
+    "WebSight": 186,
+    "ScienceQA": 164,
+    "InstructPix2Pix": 186,
+    "Flickr8k": 186,
+    "NewYorker": 186,
     "Football": 6,
+    "MagicBrush": 186
   },
   "modality_positions": {
     "text": {},
     "image": {
+      "WebSight": 186,
+      "ScienceQA": 164,
+      "InstructPix2Pix": 186,
+      "Flickr8k": 186,
+      "NewYorker": 186,
       "Football": 6,
+      "MagicBrush": 186
     },
     "video": {},
     "audio": {}

trainer_state.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "best_model_checkpoint": "/kaggle/working/xoron-final",
-  "best_metric": 4.291641629748046,
   "epoch": 1,
   "epochs_completed": 1,
   "global_step": 37,

 {
   "best_model_checkpoint": "/kaggle/working/xoron-final",
+  "best_metric": 4.019162586334472,
   "epoch": 1,
   "epochs_completed": 1,
   "global_step": 37,

training_state.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9329bf26836f4da61c1deaa53cc9d62b880df8b96c33af2739c8288691dd2b3a
-size 1419713437

 version https://git-lfs.github.com/spec/v1
+oid sha256:cff88f1a8ee14094dfffadc0ac06d52480a2d90bd740252423ecf77cdef8f6cc
+size 1419723549