Training in progress, step 300, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a2e1190afdf08e6d245aebf19748bf09f95e5346d047e995a020fa32d7ee65af
 size 109009752

 version https://git-lfs.github.com/spec/v1
+oid sha256:afabeef02cd11af399f30d799a87cdcedf48e6b4b308ff1e8fd648227d65f416
 size 109009752

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f27951f81528848db415822bf71fb9a83a227168152ca7c9b4634214b845ff2a
 size 56088788

 version https://git-lfs.github.com/spec/v1
+oid sha256:db08a3ed0537b4834693fbc56c2a76f165e2d16d1f603f5b5c5e165ccb95904a
 size 56088788

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9a4c5e895fc749303e186af008c616cc4691ee11e5379819a9cef8abc9244ae4
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:5c130768bbf9cce1ebe68f09044324e0bfed8c7b5372544cfaddcff885c19347
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bcff232e369592911db2b4e3df034b850aaaa5664b471617ca7ce83896190c8a
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:3eda02c74ec58a373b407bd46f7ba99a11b2d14ed57d7fd11002c322f6ba0709
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
-  "best_metric": 4.489497769100126e-07,
-  "best_model_checkpoint": "miner_id_24/checkpoint-280",
-  "epoch": 1.8855218855218854,
   "eval_steps": 20,
-  "global_step": 280,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -141,6 +141,21 @@
       "eval_samples_per_second": 28.669,
       "eval_steps_per_second": 0.917,
       "step": 280
     }
   ],
   "logging_steps": 100,
@@ -169,7 +184,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 1.1825582935375872e+17,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

 {
+  "best_metric": 4.185091029285104e-07,
+  "best_model_checkpoint": "miner_id_24/checkpoint-300",
+  "epoch": 2.0202020202020203,
   "eval_steps": 20,
+  "global_step": 300,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 28.669,
       "eval_steps_per_second": 0.917,
       "step": 280
+    },
+    {
+      "epoch": 2.0202020202020203,
+      "grad_norm": 1.0282737093803007e-05,
+      "learning_rate": 0.00019721004253231048,
+      "loss": 0.0,
+      "step": 300
+    },
+    {
+      "epoch": 2.0202020202020203,
+      "eval_loss": 4.185091029285104e-07,
+      "eval_runtime": 4.3862,
+      "eval_samples_per_second": 28.499,
+      "eval_steps_per_second": 0.912,
+      "step": 300
     }
   ],
   "logging_steps": 100,
       "attributes": {}
     }
   },
+  "total_flos": 1.2667815790116864e+17,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null