mrferr3t committed on
Commit
4fae396
·
verified ·
1 Parent(s): d36c999

Training in progress, step 1000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bcc457fd82f27efdda10fed960e386036a4b33abb33221deb7837e50eb062a57
3
  size 111454040
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e969e52342803b299b7ed319dcf94e15a8c84105f20d3e213c87987284453833
3
  size 111454040
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe9f1bff8d6faa01cf6769f239cc539972d3f7c6cc4228301e1f324d9e8af757
3
  size 56950996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4cb59a5ee934befa564064aaaf64c328c626a692b4093f3e04137e10811edf2
3
  size 56950996
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed7a65e4257438282c61302a05f6983560de4e3a6f299917cf5ff5127f020898
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf3db837f33a4e5d1f0863b8fcce835716b9cd562fb153c4a26c2c7dce10c99d
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d1f0f5a6a174cd37a4de7168d2654831d469666ae99ac8ac3662c8eaf7683b5
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3fefa9335f6222d1a14d72f837041665420095d7f813e43c216743bd291bfe3
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.5773412585258484,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-880",
4
- "epoch": 0.9948186528497409,
5
  "eval_steps": 40,
6
- "global_step": 960,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -270,6 +270,21 @@
270
  "eval_samples_per_second": 9.715,
271
  "eval_steps_per_second": 0.333,
272
  "step": 960
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
273
  }
274
  ],
275
  "logging_steps": 100,
@@ -284,7 +299,7 @@
284
  "early_stopping_threshold": 0.0
285
  },
286
  "attributes": {
287
- "early_stopping_patience_counter": 2
288
  }
289
  },
290
  "TrainerControl": {
@@ -293,12 +308,12 @@
293
  "should_evaluate": false,
294
  "should_log": false,
295
  "should_save": true,
296
- "should_training_stop": false
297
  },
298
  "attributes": {}
299
  }
300
  },
301
- "total_flos": 3.128126001905664e+17,
302
  "train_batch_size": 2,
303
  "trial_name": null,
304
  "trial_params": null
 
1
  {
2
  "best_metric": 0.5773412585258484,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-880",
4
+ "epoch": 1.0362694300518134,
5
  "eval_steps": 40,
6
+ "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
270
  "eval_samples_per_second": 9.715,
271
  "eval_steps_per_second": 0.333,
272
  "step": 960
273
+ },
274
+ {
275
+ "epoch": 1.0362694300518134,
276
+ "grad_norm": 0.8339794278144836,
277
+ "learning_rate": 0.000299768901482495,
278
+ "loss": 1.0328,
279
+ "step": 1000
280
+ },
281
+ {
282
+ "epoch": 1.0362694300518134,
283
+ "eval_loss": 0.5930935740470886,
284
+ "eval_runtime": 21.0358,
285
+ "eval_samples_per_second": 9.698,
286
+ "eval_steps_per_second": 0.333,
287
+ "step": 1000
288
  }
289
  ],
290
  "logging_steps": 100,
 
299
  "early_stopping_threshold": 0.0
300
  },
301
  "attributes": {
302
+ "early_stopping_patience_counter": 3
303
  }
304
  },
305
  "TrainerControl": {
 
308
  "should_evaluate": false,
309
  "should_log": false,
310
  "should_save": true,
311
+ "should_training_stop": true
312
  },
313
  "attributes": {}
314
  }
315
  },
316
+ "total_flos": 3.258924645482496e+17,
317
  "train_batch_size": 2,
318
  "trial_name": null,
319
  "trial_params": null