End of training

Files changed (5) hide show

all_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "total_flos": 0.0,
-    "train_loss": 5.925413926080284e-07,
-    "train_runtime": 35343.127,
     "train_samples": 45000,
-    "train_samples_per_second": 0.013,
-    "train_steps_per_second": 0.013
 }

 {
     "total_flos": 0.0,
+    "train_loss": 1.3050906145387637e-09,
+    "train_runtime": 4363.1554,
     "train_samples": 45000,
+    "train_samples_per_second": 0.103,
+    "train_steps_per_second": 0.103
 }

runs/Feb05_11-56-04_AVA-STATION/events.out.tfevents.1738752970.AVA-STATION.622808.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e2ce2e9c2b0b18ba719590a91665a096f24a7f5edaa1581d8e231d7d1b8d7cf3
+size 6109

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "total_flos": 0.0,
-    "train_loss": 5.925413926080284e-07,
-    "train_runtime": 35343.127,
     "train_samples": 45000,
-    "train_samples_per_second": 0.013,
-    "train_steps_per_second": 0.013
 }

 {
     "total_flos": 0.0,
+    "train_loss": 1.3050906145387637e-09,
+    "train_runtime": 4363.1554,
     "train_samples": 45000,
+    "train_samples_per_second": 0.103,
+    "train_steps_per_second": 0.103
 }

trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.01,
   "eval_steps": 500,
-  "global_step": 450,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -594,13 +594,19 @@
       "step": 450
     },
     {
-      "epoch": 0.01,
-      "step": 450,
       "total_flos": 0.0,
-      "train_loss": 5.925413926080284e-07,
-      "train_runtime": 35343.127,
-      "train_samples_per_second": 0.013,
-      "train_steps_per_second": 0.013
     }
   ],
   "logging_steps": 10,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.010022222222222222,
   "eval_steps": 500,
+  "global_step": 451,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "step": 450
     },
     {
+      "completion_length": 379.875,
+      "epoch": 0.010022222222222222,
+      "kl": 0.0005991907673887908,
+      "reward": 0.375,
+      "reward_std": 0.5175491571426392,
+      "rewards/equation_reward_func": 0.0,
+      "rewards/format_reward_func": 0.375,
+      "step": 451,
       "total_flos": 0.0,
+      "train_loss": 1.3050906145387637e-09,
+      "train_runtime": 4363.1554,
+      "train_samples_per_second": 0.103,
+      "train_steps_per_second": 0.103
     }
   ],
   "logging_steps": 10,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d875b2ce3ec833cc1adfdd719f3e676ad7c17cebd64ffc4e6f8bed2655a8f164
 size 5624

 version https://git-lfs.github.com/spec/v1
+oid sha256:f712c19fc1e1946e5e4bb43eccae4449788e72205cdd94458e1f84efc985453b
 size 5624