mrferr3t committed on
Commit
3dc78b5
·
verified ·
1 Parent(s): 5a8a37b

Training in progress, step 380, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27dcec798f401aea531332fd52d47af4e2e2052534e106a38738f74d8310f559
3
  size 109009752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14c1fd6535b1947d88953614c47802dd8b81a013bb8594bc2fa89f725857c9ac
3
  size 109009752
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f5f75e289bb3450e55503e27675a790d9ae74e663bd5176ca0036dc79eed1f7f
3
  size 56088788
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c946b2c89717f2d9b83962c1fea716d72aa3ccdf0862f8da941b1f3acef991a
3
  size 56088788
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f464ee492959ca51f31ddd6c918f5e6ed3b897ddaa5bd27211176d3e42d4533
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8966b15f85185715dd994ab5a2d54fa29563cc2e5c4c1515e4dbf61731e57b3f
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96a1a67751ef8c6e878b8ba1ee8cfd48efab59bef2ad58f80bf89ebc2ab37857
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8092b14896167cec4bcd41544a9706c780edac6d6d1675e384862c5b2b347c56
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 3.503983521113696e-07,
3
- "best_model_checkpoint": "miner_id_24/checkpoint-360",
4
- "epoch": 2.4242424242424243,
5
  "eval_steps": 20,
6
- "global_step": 360,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -180,6 +180,14 @@
180
  "eval_samples_per_second": 28.493,
181
  "eval_steps_per_second": 0.912,
182
  "step": 360
 
 
 
 
 
 
 
 
183
  }
184
  ],
185
  "logging_steps": 100,
@@ -208,7 +216,7 @@
208
  "attributes": {}
209
  }
210
  },
211
- "total_flos": 1.5202435039494144e+17,
212
  "train_batch_size": 8,
213
  "trial_name": null,
214
  "trial_params": null
 
1
  {
2
+ "best_metric": 3.3884660410876677e-07,
3
+ "best_model_checkpoint": "miner_id_24/checkpoint-380",
4
+ "epoch": 2.558922558922559,
5
  "eval_steps": 20,
6
+ "global_step": 380,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
180
  "eval_samples_per_second": 28.493,
181
  "eval_steps_per_second": 0.912,
182
  "step": 360
183
+ },
184
+ {
185
+ "epoch": 2.558922558922559,
186
+ "eval_loss": 3.3884660410876677e-07,
187
+ "eval_runtime": 4.549,
188
+ "eval_samples_per_second": 27.478,
189
+ "eval_steps_per_second": 0.879,
190
+ "step": 380
191
  }
192
  ],
193
  "logging_steps": 100,
 
216
  "attributes": {}
217
  }
218
  },
219
+ "total_flos": 1.6047308122619904e+17,
220
  "train_batch_size": 8,
221
  "trial_name": null,
222
  "trial_params": null