lesso08 commited on
Commit
5ebc452
·
verified ·
1 Parent(s): 1132b20

Training in progress, step 150, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f326f334eef37db7e81d1bdc92c8688331a0abc7cc3fb88f688626369d739878
3
  size 639691872
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d7e4a616242a8ccbeb438b98421f0be481edb7bd3dfaa3fa392b185e18f7c0c
3
  size 639691872
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dcb7967971c95e1cb3bec161bb5c36617b4c72d2f099ade3d966881a7c490888
3
  size 325339796
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5944558899ef544bfa4ed171cf2546f64d41350e01d53000113a170c27ff2146
3
  size 325339796
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25eaed32035452f61b530f05ddb1757ce562ec2a5b996368ee4ed21c4aef9551
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb60a6ffe8ef9e5fce9d63efc6be2357546fb0493004894178b1ab2ce90cf914
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27d9d26262db0192551c63e8e2cb503f12fb8cb162ff6ce7f18ac6f7e9d328d6
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:662c9e898ac39a71b423a2785b52925d7ca06517ad79ef8a45be543246b1a1b6
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 1.273123025894165,
3
- "best_model_checkpoint": "miner_id_24/checkpoint-50",
4
- "epoch": 0.006518267444513249,
5
  "eval_steps": 50,
6
- "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -101,6 +101,49 @@
101
  "eval_samples_per_second": 14.474,
102
  "eval_steps_per_second": 3.619,
103
  "step": 100
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
104
  }
105
  ],
106
  "logging_steps": 10,
@@ -115,7 +158,7 @@
115
  "early_stopping_threshold": 0.0
116
  },
117
  "attributes": {
118
- "early_stopping_patience_counter": 1
119
  }
120
  },
121
  "TrainerControl": {
@@ -129,7 +172,7 @@
129
  "attributes": {}
130
  }
131
  },
132
- "total_flos": 2.0633874937675776e+16,
133
  "train_batch_size": 4,
134
  "trial_name": null,
135
  "trial_params": null
 
1
  {
2
+ "best_metric": 1.1874332427978516,
3
+ "best_model_checkpoint": "miner_id_24/checkpoint-150",
4
+ "epoch": 0.009777401166769872,
5
  "eval_steps": 50,
6
+ "global_step": 150,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
101
  "eval_samples_per_second": 14.474,
102
  "eval_steps_per_second": 3.619,
103
  "step": 100
104
+ },
105
+ {
106
+ "epoch": 0.007170094188964573,
107
+ "grad_norm": 2.3844895362854004,
108
+ "learning_rate": 0.00019900872759483047,
109
+ "loss": 1.0244,
110
+ "step": 110
111
+ },
112
+ {
113
+ "epoch": 0.007821920933415898,
114
+ "grad_norm": 2.4352855682373047,
115
+ "learning_rate": 0.0001958265496573284,
116
+ "loss": 1.1891,
117
+ "step": 120
118
+ },
119
+ {
120
+ "epoch": 0.008473747677867223,
121
+ "grad_norm": 3.231959819793701,
122
+ "learning_rate": 0.00019219700200026827,
123
+ "loss": 1.2308,
124
+ "step": 130
125
+ },
126
+ {
127
+ "epoch": 0.009125574422318547,
128
+ "grad_norm": 2.5154852867126465,
129
+ "learning_rate": 0.0001881377674149945,
130
+ "loss": 1.2077,
131
+ "step": 140
132
+ },
133
+ {
134
+ "epoch": 0.009777401166769872,
135
+ "grad_norm": 3.0093817710876465,
136
+ "learning_rate": 0.00018366862208437368,
137
+ "loss": 1.3988,
138
+ "step": 150
139
+ },
140
+ {
141
+ "epoch": 0.009777401166769872,
142
+ "eval_loss": 1.1874332427978516,
143
+ "eval_runtime": 447.657,
144
+ "eval_samples_per_second": 14.431,
145
+ "eval_steps_per_second": 3.608,
146
+ "step": 150
147
  }
148
  ],
149
  "logging_steps": 10,
 
158
  "early_stopping_threshold": 0.0
159
  },
160
  "attributes": {
161
+ "early_stopping_patience_counter": 0
162
  }
163
  },
164
  "TrainerControl": {
 
172
  "attributes": {}
173
  }
174
  },
175
+ "total_flos": 3.128632256810189e+16,
176
  "train_batch_size": 4,
177
  "trial_name": null,
178
  "trial_params": null