auxyus committed on
Commit
b197ff6
·
verified ·
1 Parent(s): 03fd114

Training in progress, step 63, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:62684bf0eec044fb0a9a60709738b246e464592f15969ca36cbd206f6a65b9ba
3
  size 167832240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2453b22f077c9e633155bde5a44c5a5c92ddb254cf0fe9e618e76bbd38133b08
3
  size 167832240
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ba68244a466bdf0b5d267bb6e43fc63894926d785d1e87c91c9b950737d9101
3
  size 85723284
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e79d76de3a27d79eb105caffe8c2ea0c9c2c134159ec637025bffdd723a230d4
3
  size 85723284
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:60379b7ec7fc50400ed25c0728f72548d8aacb996c92794cc4fa8f2026f83ce9
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ade06f0db401bf7db7e4bf579716041b8a433a97a601335efdecad97edb03945
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2011b1e019073e4bafc29de9703ff0a6e7c1252c3a53d804807bd1c99d390d1c
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e53b95eff99f2334cbf7ed4c962db83cb42e931305982518e928382563b5670d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.006502694403468103,
5
  "eval_steps": 9,
6
- "global_step": 54,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -189,6 +189,35 @@
189
  "eval_samples_per_second": 7.035,
190
  "eval_steps_per_second": 0.88,
191
  "step": 54
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
192
  }
193
  ],
194
  "logging_steps": 3,
@@ -208,7 +237,7 @@
208
  "attributes": {}
209
  }
210
  },
211
- "total_flos": 1.518761456613458e+17,
212
  "train_batch_size": 8,
213
  "trial_name": null,
214
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.007586476804046121,
5
  "eval_steps": 9,
6
+ "global_step": 63,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
189
  "eval_samples_per_second": 7.035,
190
  "eval_steps_per_second": 0.88,
191
  "step": 54
192
+ },
193
+ {
194
+ "epoch": 0.006863955203660776,
195
+ "grad_norm": 14.141239166259766,
196
+ "learning_rate": 4.6512176312793736e-05,
197
+ "loss": 5.6544,
198
+ "step": 57
199
+ },
200
+ {
201
+ "epoch": 0.007225216003853448,
202
+ "grad_norm": 13.24157428741455,
203
+ "learning_rate": 4.131759111665349e-05,
204
+ "loss": 5.7787,
205
+ "step": 60
206
+ },
207
+ {
208
+ "epoch": 0.007586476804046121,
209
+ "grad_norm": 13.354693412780762,
210
+ "learning_rate": 3.6218132209150045e-05,
211
+ "loss": 5.9927,
212
+ "step": 63
213
+ },
214
+ {
215
+ "epoch": 0.007586476804046121,
216
+ "eval_loss": 1.4332555532455444,
217
+ "eval_runtime": 1985.8578,
218
+ "eval_samples_per_second": 7.043,
219
+ "eval_steps_per_second": 0.881,
220
+ "step": 63
221
  }
222
  ],
223
  "logging_steps": 3,
 
237
  "attributes": {}
238
  }
239
  },
240
+ "total_flos": 1.7718883660490342e+17,
241
  "train_batch_size": 8,
242
  "trial_name": null,
243
  "trial_params": null