error577 committed on
Commit
22e73da
·
verified ·
1 Parent(s): da056f9

Training in progress, step 18, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:79ef18e08a9c17b2fb9b8ccde982a8239483cde795247827af7cb580503bb16a
3
  size 40036040
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ea5682a32e67553733161e24919b8256171520aaf9a72fb6461c8d023334b0f
3
  size 40036040
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:944c8456b3e58c34cea3f7a300e3a051a0c84fd9656d9059a82ebdf9469ba1c5
3
  size 20814996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8417a2e0bd9dee93861abecea4888b406a923187a5ec3ba715ab84d9297bc24
3
  size 20814996
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38d4ce98297dbe9ce16d8aeca4ab3d4f1f6ecfc395ce39836ce23e0f5364d053
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12da8cf14faf21b4ce97a203fbc022d55852967af79c15ad0d9fb35a64362e46
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:73cbf425fe8e079f586aa4701c8340389c70a4705a912add7a2c0a4fa520c8a7
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae75e092a889d5e969a2ae073023153d014a68766ac86876f11258c486a735da
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.023732270325391675,
5
  "eval_steps": 2,
6
- "global_step": 16,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -191,6 +191,28 @@
191
  "eval_samples_per_second": 3.755,
192
  "eval_steps_per_second": 3.755,
193
  "step": 16
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
194
  }
195
  ],
196
  "logging_steps": 1,
@@ -210,7 +232,7 @@
210
  "attributes": {}
211
  }
212
  },
213
- "total_flos": 2602068892188672.0,
214
  "train_batch_size": 1,
215
  "trial_name": null,
216
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.026698804116065636,
5
  "eval_steps": 2,
6
+ "global_step": 18,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
191
  "eval_samples_per_second": 3.755,
192
  "eval_steps_per_second": 3.755,
193
  "step": 16
194
+ },
195
+ {
196
+ "epoch": 0.025215537220728654,
197
+ "grad_norm": 25.165361404418945,
198
+ "learning_rate": 4.12214747707527e-05,
199
+ "loss": 4.9765,
200
+ "step": 17
201
+ },
202
+ {
203
+ "epoch": 0.026698804116065636,
204
+ "grad_norm": 14.660453796386719,
205
+ "learning_rate": 1.9098300562505266e-05,
206
+ "loss": 1.5801,
207
+ "step": 18
208
+ },
209
+ {
210
+ "epoch": 0.026698804116065636,
211
+ "eval_loss": 0.34035831689834595,
212
+ "eval_runtime": 151.1958,
213
+ "eval_samples_per_second": 3.757,
214
+ "eval_steps_per_second": 3.757,
215
+ "step": 18
216
  }
217
  ],
218
  "logging_steps": 1,
 
232
  "attributes": {}
233
  }
234
  },
235
+ "total_flos": 2927327503712256.0,
236
  "train_batch_size": 1,
237
  "trial_name": null,
238
  "trial_params": null