mrferr3t commited on
Commit
53985b4
·
verified ·
1 Parent(s): bdfc7e5

Training in progress, step 360, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7384e6e0afd8f05180f65c96007714d18e0e6fb36424c6547b4ec71902d11c5
3
  size 109009752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27dcec798f401aea531332fd52d47af4e2e2052534e106a38738f74d8310f559
3
  size 109009752
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c01ec9d1f8083459f22d7eb7f74be826665564bff8cfff1031d1dd0d4707690e
3
  size 56088788
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5f75e289bb3450e55503e27675a790d9ae74e663bd5176ca0036dc79eed1f7f
3
  size 56088788
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:75b81576a953c126a70feb1037e15d1536a41145956ed969eb430642c3a082d6
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f464ee492959ca51f31ddd6c918f5e6ed3b897ddaa5bd27211176d3e42d4533
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f554738d4c98e192859c545795d9bad33dffcf55dc2610937bb10f054a491a5
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96a1a67751ef8c6e878b8ba1ee8cfd48efab59bef2ad58f80bf89ebc2ab37857
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 3.6971795225326787e-07,
3
- "best_model_checkpoint": "miner_id_24/checkpoint-340",
4
- "epoch": 2.28956228956229,
5
  "eval_steps": 20,
6
- "global_step": 340,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -172,6 +172,14 @@
172
  "eval_samples_per_second": 28.424,
173
  "eval_steps_per_second": 0.91,
174
  "step": 340
 
 
 
 
 
 
 
 
175
  }
176
  ],
177
  "logging_steps": 100,
@@ -200,7 +208,7 @@
200
  "attributes": {}
201
  }
202
  },
203
- "total_flos": 1.4357561956368384e+17,
204
  "train_batch_size": 8,
205
  "trial_name": null,
206
  "trial_params": null
 
1
  {
2
+ "best_metric": 3.503983521113696e-07,
3
+ "best_model_checkpoint": "miner_id_24/checkpoint-360",
4
+ "epoch": 2.4242424242424243,
5
  "eval_steps": 20,
6
+ "global_step": 360,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
172
  "eval_samples_per_second": 28.424,
173
  "eval_steps_per_second": 0.91,
174
  "step": 340
175
+ },
176
+ {
177
+ "epoch": 2.4242424242424243,
178
+ "eval_loss": 3.503983521113696e-07,
179
+ "eval_runtime": 4.387,
180
+ "eval_samples_per_second": 28.493,
181
+ "eval_steps_per_second": 0.912,
182
+ "step": 360
183
  }
184
  ],
185
  "logging_steps": 100,
 
208
  "attributes": {}
209
  }
210
  },
211
+ "total_flos": 1.5202435039494144e+17,
212
  "train_batch_size": 8,
213
  "trial_name": null,
214
  "trial_params": null