Update model weights after training (epoch 1, loss 4.2916)

Files changed (11) hide show

audio_decoder.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e80dd44856ab9de02baf7f75a2388092434554d243ed896b8d27b382470efbb0
 size 1458415836

 version https://git-lfs.github.com/spec/v1
+oid sha256:37e38d5f45ab1bb841c51d43d1a830339c9554d7b7121b40c29543be6b8bb246
 size 1458415836

cross_attention.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:431b826b0b603dc6fe556705ad128da3e3ad62916bbf682cf56054dfc1f82971
 size 174191400

 version https://git-lfs.github.com/spec/v1
+oid sha256:f7967eb8d40a1c69ade87aaae8872447a9f3b28418fadde6d1a8f876d96a6848
 size 174191400

generator.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:77991e08ee440c540d1fd2cbf8e8d83e87f62aac203e71adfa2182086a041aa2
 size 629440508

 version https://git-lfs.github.com/spec/v1
+oid sha256:89ea74af2d5ac45430e7dc96fd17ddf368b8baa87a4133046782ec32e7a63224
 size 629440508

llm.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8e8d0ac87d7bb273d16a5a89ac99ec879ce0981a19c5b34078e00e080bd447a5
 size 1506831304

 version https://git-lfs.github.com/spec/v1
+oid sha256:96e14153b590b91954c672ba79a681cd40c08dfc82dcb9e5500e87c2d8d23c83
 size 1506831304

sample_images/epoch1_sample1.png ADDED Viewed

sample_images/epoch1_sample2.png ADDED Viewed

sample_images/epoch1_sample3.png ADDED Viewed

streaming_state.json CHANGED Viewed

@@ -1,33 +1,33 @@
 {
-  "epoch": 3,
-  "unique_samples": 500,
-  "total_yields": 1000,
   "dataset_positions": {
-    "WebSight": 86,
-    "ScienceQA": 64,
-    "InstructPix2Pix": 86,
-    "Flickr8k": 86,
-    "NewYorker": 86,
     "Football": 6,
-    "MagicBrush": 86
   },
   "modality_positions": {
     "text": {},
     "image": {
-      "WebSight": 86,
-      "ScienceQA": 64,
-      "InstructPix2Pix": 86,
-      "Flickr8k": 86,
-      "NewYorker": 86,
       "Football": 6,
-      "MagicBrush": 86
     },
     "video": {},
     "audio": {}
   },
   "modality_counts": {
     "text": 0,
-    "image": 0,
     "video": 0,
     "audio": 0
   },

 {
+  "epoch": 4,
+  "unique_samples": 800,
+  "total_yields": 1600,
   "dataset_positions": {
+    "WebSight": 136,
+    "ScienceQA": 114,
+    "InstructPix2Pix": 136,
+    "Flickr8k": 136,
+    "NewYorker": 136,
     "Football": 6,
+    "MagicBrush": 136
   },
   "modality_positions": {
     "text": {},
     "image": {
+      "WebSight": 136,
+      "ScienceQA": 114,
+      "InstructPix2Pix": 136,
+      "Flickr8k": 136,
+      "NewYorker": 136,
       "Football": 6,
+      "MagicBrush": 136
     },
     "video": {},
     "audio": {}
   },
   "modality_counts": {
     "text": 0,
+    "image": 300,
     "video": 0,
     "audio": 0
   },

tokenizer.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b48623d7dbbb520d1da2833656a41ab6878dd0254184667ea2c8dfeed1e3f61d
-size 11522951

 version https://git-lfs.github.com/spec/v1
+oid sha256:d27d705d6b96a348ab0adece83feb6480983d947f7be700666328942f89381b5
+size 11523225

trainer_state.json CHANGED Viewed

@@ -1,14 +1,14 @@
 {
   "best_model_checkpoint": "/kaggle/working/xoron-final",
-  "best_metric": 0.0,
   "epoch": 1,
   "epochs_completed": 1,
-  "global_step": 0,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [],
   "logging_steps": 50,
-  "max_steps": 0,
   "num_train_epochs": 1,
   "total_flos": 0,
   "train_batch_size": 1,

 {
   "best_model_checkpoint": "/kaggle/working/xoron-final",
+  "best_metric": 4.291641629748046,
   "epoch": 1,
   "epochs_completed": 1,
+  "global_step": 37,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [],
   "logging_steps": 50,
+  "max_steps": 37,
   "num_train_epochs": 1,
   "total_flos": 0,
   "train_batch_size": 1,

training_state.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3813547fac897078f6b9545389496768018915ce23a16b9cc586db71e1f146a4
-size 5143

 version https://git-lfs.github.com/spec/v1
+oid sha256:9329bf26836f4da61c1deaa53cc9d62b880df8b96c33af2739c8288691dd2b3a
+size 1419713437