Training in progress, step 560, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:eb6cdf5d8b6226f6a41ae33f3f79fa018f920f25a94ad2acaf9fd20aabddde03
 size 109009752

 version https://git-lfs.github.com/spec/v1
+oid sha256:0d416b96ddb86b39acea285afa1c535ead42e497a733cb29207280e6c2f83fa7
 size 109009752

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5d87b2845003ad9c26f85337961d9910d627941cfca2166b4fd830e4304e7a5d
 size 56088788

 version https://git-lfs.github.com/spec/v1
+oid sha256:d337ec9fb2f1caa18ce4f33b9a96b7fcffd2a399f435bf0b35f9ff16c4c1ad17
 size 56088788

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c7aafa5db1b56a982de2d1a0e669dfa9a2ace2d844876b7ab6c68d2ae587a2e2
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:1df3a3cae241082d68c3a6cb326bf131e93d4d808298cd38ff7f1baeee5d48f8
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fdc990d65d20244e2fe8b10836667fc181b3d1910eff3fd20bd309d901a413a6
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:bef42e564008e32e1ede623c5c541c27431e92ce859dc16d7a639dbd642b25ba
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": 2.6893604854194564e-07,
   "best_model_checkpoint": "miner_id_24/checkpoint-540",
-  "epoch": 3.6363636363636362,
   "eval_steps": 20,
-  "global_step": 540,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -266,6 +266,14 @@
       "eval_samples_per_second": 28.484,
       "eval_steps_per_second": 0.912,
       "step": 540
     }
   ],
   "logging_steps": 100,
@@ -280,7 +288,7 @@
         "early_stopping_threshold": 0.0
       },
       "attributes": {
-        "early_stopping_patience_counter": 0
       }
     },
     "TrainerControl": {
@@ -294,7 +302,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 2.2803652559241216e+17,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": 2.6893604854194564e-07,
   "best_model_checkpoint": "miner_id_24/checkpoint-540",
+  "epoch": 3.771043771043771,
   "eval_steps": 20,
+  "global_step": 560,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 28.484,
       "eval_steps_per_second": 0.912,
       "step": 540
+    },
+    {
+      "epoch": 3.771043771043771,
+      "eval_loss": 2.6898223381977004e-07,
+      "eval_runtime": 4.4647,
+      "eval_samples_per_second": 27.998,
+      "eval_steps_per_second": 0.896,
+      "step": 560
     }
   ],
   "logging_steps": 100,
         "early_stopping_threshold": 0.0
       },
       "attributes": {
+        "early_stopping_patience_counter": 1
       }
     },
     "TrainerControl": {
       "attributes": {}
     }
   },
+  "total_flos": 2.3648525642366976e+17,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null