mrferr3t committed on
Commit
19d2efd
·
verified ·
1 Parent(s): 661c2de

Training in progress, step 258, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8e00f795373d48fe700f3ac538f1e6d917f657c2991866baedbe4e97016442d
3
  size 83945296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7642ab38cc4d0ac27666134eef25f6c939e09eff7de2f2a5046f957d09102f5a
3
  size 83945296
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27e19611464de0f4881682ee88217089320bf712b39dad09f36dceb911be8b94
3
- size 43122580
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c34e65ccc0893f3f3201d4a3301526f6e4e030e855c54408dc5be073adb6686d
3
+ size 43123028
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1de20a5cd3c88682fc5b2bee85dd4db1a9c7684b18bea5f60553dccb8e074f2c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b536e9b95d89439a3272f61cd2b9c84ddc6a9f0549c2b6fbdf7508ca48a0bca
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ac80c0099741497605b86b89633b368aa3c621dc73b66fb8d88b5b18259b2d6
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de60b07a925742ae141dd83d6368ce8ec8048f752fbd50a4e436245ca25d81ac
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.44831588864326477,
3
- "best_model_checkpoint": "miner_id_24/checkpoint-215",
4
- "epoch": 0.6643491695635381,
5
  "eval_steps": 43,
6
- "global_step": 215,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -90,6 +90,21 @@
90
  "eval_samples_per_second": 21.424,
91
  "eval_steps_per_second": 1.35,
92
  "step": 215
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
93
  }
94
  ],
95
  "logging_steps": 43,
@@ -118,7 +133,7 @@
118
  "attributes": {}
119
  }
120
  },
121
- "total_flos": 1.1290711730537103e+18,
122
  "train_batch_size": 16,
123
  "trial_name": null,
124
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.44344472885131836,
3
+ "best_model_checkpoint": "miner_id_24/checkpoint-258",
4
+ "epoch": 0.7972190034762456,
5
  "eval_steps": 43,
6
+ "global_step": 258,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
90
  "eval_samples_per_second": 21.424,
91
  "eval_steps_per_second": 1.35,
92
  "step": 215
93
+ },
94
+ {
95
+ "epoch": 0.7972190034762456,
96
+ "grad_norm": 3.9321422576904297,
97
+ "learning_rate": 0.00039997623742088825,
98
+ "loss": 3.5561,
99
+ "step": 258
100
+ },
101
+ {
102
+ "epoch": 0.7972190034762456,
103
+ "eval_loss": 0.44344472885131836,
104
+ "eval_runtime": 70.4613,
105
+ "eval_samples_per_second": 21.615,
106
+ "eval_steps_per_second": 1.362,
107
+ "step": 258
108
  }
109
  ],
110
  "logging_steps": 43,
 
133
  "attributes": {}
134
  }
135
  },
136
+ "total_flos": 1.3502583541145272e+18,
137
  "train_batch_size": 16,
138
  "trial_name": null,
139
  "trial_params": null