mrferr3t committed on
Commit
f92323b
·
verified ·
1 Parent(s): 767a05d

Training in progress, step 340, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0096943c56e6d5c858199f3d20e43a66545cfafbb05dac5dd43a4f00ef99a118
3
  size 109009752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7384e6e0afd8f05180f65c96007714d18e0e6fb36424c6547b4ec71902d11c5
3
  size 109009752
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aae87e246941bbd07ed034fc4fce008471a5a64f84952a0a68d077c2c4799647
3
  size 56088788
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c01ec9d1f8083459f22d7eb7f74be826665564bff8cfff1031d1dd0d4707690e
3
  size 56088788
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be951e35134e38a25ddb549895edf56032d2fadab85e0bd34febb4e424907c3a
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75b81576a953c126a70feb1037e15d1536a41145956ed969eb430642c3a082d6
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f23adcb0ffe9f4db397db4bf9a51186d6924cf27594d2ce31102b42ec188074
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f554738d4c98e192859c545795d9bad33dffcf55dc2610937bb10f054a491a5
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 3.925752878330968e-07,
3
- "best_model_checkpoint": "miner_id_24/checkpoint-320",
4
- "epoch": 2.154882154882155,
5
  "eval_steps": 20,
6
- "global_step": 320,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -164,6 +164,14 @@
164
  "eval_samples_per_second": 28.562,
165
  "eval_steps_per_second": 0.914,
166
  "step": 320
 
 
 
 
 
 
 
 
167
  }
168
  ],
169
  "logging_steps": 100,
@@ -192,7 +200,7 @@
192
  "attributes": {}
193
  }
194
  },
195
- "total_flos": 1.3512688873242624e+17,
196
  "train_batch_size": 8,
197
  "trial_name": null,
198
  "trial_params": null
 
1
  {
2
+ "best_metric": 3.6971795225326787e-07,
3
+ "best_model_checkpoint": "miner_id_24/checkpoint-340",
4
+ "epoch": 2.28956228956229,
5
  "eval_steps": 20,
6
+ "global_step": 340,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
164
  "eval_samples_per_second": 28.562,
165
  "eval_steps_per_second": 0.914,
166
  "step": 320
167
+ },
168
+ {
169
+ "epoch": 2.28956228956229,
170
+ "eval_loss": 3.6971795225326787e-07,
171
+ "eval_runtime": 4.3977,
172
+ "eval_samples_per_second": 28.424,
173
+ "eval_steps_per_second": 0.91,
174
+ "step": 340
175
  }
176
  ],
177
  "logging_steps": 100,
 
200
  "attributes": {}
201
  }
202
  },
203
+ "total_flos": 1.4357561956368384e+17,
204
  "train_batch_size": 8,
205
  "trial_name": null,
206
  "trial_params": null