mrferr3t committed on
Commit
48cc53c
·
verified ·
1 Parent(s): 1ea482f

Training in progress, step 240, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d015affd6db158bedfd9fd25c50ae0db56683b4af68825771013d0c7f1761e7
3
  size 109009752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2ca6f541a9d128a71b52474f12655bf699880f16de2961187b92699c533fb7b
3
  size 109009752
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d780d1844496ddf7c79f7bfe775e1ce1686bb74b6d42ed307c08192fcae54ba8
3
  size 56088148
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad5670142902563ea66cb6058b04d9c3cd19723cabb474739b676c163e64ddd3
3
  size 56088148
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c8446a0101b92101f9f087b8c34cf04dc6908f0b5cf93c2a4b2014185e0af79
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93f0ec112c9b0167a2c769cccced6910c1decb6450825497553afbf16ac1002d
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:628bd7f1457e043dd759d9a2b466e6a3738950f1815b17b82ee8d82f030b600e
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af9a5a02fd2f64af4b394ceffc9ffebe28abc2a4d62808bb3561346ca599f084
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 5.753882987846737e-07,
3
- "best_model_checkpoint": "miner_id_24/checkpoint-220",
4
- "epoch": 1.4814814814814814,
5
  "eval_steps": 20,
6
- "global_step": 220,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -117,6 +117,14 @@
117
  "eval_samples_per_second": 28.744,
118
  "eval_steps_per_second": 0.92,
119
  "step": 220
 
 
 
 
 
 
 
 
120
  }
121
  ],
122
  "logging_steps": 100,
@@ -145,7 +153,7 @@
145
  "attributes": {}
146
  }
147
  },
148
- "total_flos": 9.290963685998592e+16,
149
  "train_batch_size": 8,
150
  "trial_name": null,
151
  "trial_params": null
 
1
  {
2
+ "best_metric": 5.237209279584931e-07,
3
+ "best_model_checkpoint": "miner_id_24/checkpoint-240",
4
+ "epoch": 1.6161616161616161,
5
  "eval_steps": 20,
6
+ "global_step": 240,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
117
  "eval_samples_per_second": 28.744,
118
  "eval_steps_per_second": 0.92,
119
  "step": 220
120
+ },
121
+ {
122
+ "epoch": 1.6161616161616161,
123
+ "eval_loss": 5.237209279584931e-07,
124
+ "eval_runtime": 4.3453,
125
+ "eval_samples_per_second": 28.767,
126
+ "eval_steps_per_second": 0.921,
127
+ "step": 240
128
  }
129
  ],
130
  "logging_steps": 100,
 
153
  "attributes": {}
154
  }
155
  },
156
+ "total_flos": 1.0135836769124352e+17,
157
  "train_batch_size": 8,
158
  "trial_name": null,
159
  "trial_params": null