mrferr3t committed on
Commit
7dc1917
·
verified ·
1 Parent(s): bc36c94

Training in progress, step 40, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9cec129b4f8a0920ac329e841d136fb13fa3a4dac2472fd85bddb6c8aa2c9c35
3
  size 109009752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec8af09ea1ab2375872b62219be9333db29fde1e77fb8983403e001f04945252
3
  size 109009752
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a73fac7d3563437a76adbea0f9aedc23cf5ae54325ae15fbd01e23eb98052f6
3
  size 56088148
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a3774a20cf58dce6c8704d494e52999ee482552ef6a2990602964e507df389e
3
  size 56088148
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:115f8b8ce45ad51489027f59416f2021c410ae7004969287814b0dde5c3cc44f
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35bb90a354ebd23af0a5c0c1246f630c256d6eae0cf735c8f8719f8c325c2b7d
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7df70caaedac0c234c7f5937694a04d6ee70bc0b2ef988bc747140f852d79a1
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31da5a14cc904adc54ea83cca79e784b23d086943331be4291a1b3f48fa9a4d1
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 5.0069978897226974e-05,
3
- "best_model_checkpoint": "miner_id_24/checkpoint-20",
4
- "epoch": 0.13468013468013468,
5
  "eval_steps": 20,
6
- "global_step": 20,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -23,6 +23,14 @@
23
  "eval_samples_per_second": 28.585,
24
  "eval_steps_per_second": 0.915,
25
  "step": 20
 
 
 
 
 
 
 
 
26
  }
27
  ],
28
  "logging_steps": 100,
@@ -51,7 +59,7 @@
51
  "attributes": {}
52
  }
53
  },
54
- "total_flos": 8448730831257600.0,
55
  "train_batch_size": 8,
56
  "trial_name": null,
57
  "trial_params": null
 
1
  {
2
+ "best_metric": 8.045045433391351e-06,
3
+ "best_model_checkpoint": "miner_id_24/checkpoint-40",
4
+ "epoch": 0.26936026936026936,
5
  "eval_steps": 20,
6
+ "global_step": 40,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
23
  "eval_samples_per_second": 28.585,
24
  "eval_steps_per_second": 0.915,
25
  "step": 20
26
+ },
27
+ {
28
+ "epoch": 0.26936026936026936,
29
+ "eval_loss": 8.045045433391351e-06,
30
+ "eval_runtime": 4.3441,
31
+ "eval_samples_per_second": 28.775,
32
+ "eval_steps_per_second": 0.921,
33
+ "step": 40
34
  }
35
  ],
36
  "logging_steps": 100,
 
59
  "attributes": {}
60
  }
61
  },
62
+ "total_flos": 1.68974616625152e+16,
63
  "train_batch_size": 8,
64
  "trial_name": null,
65
  "trial_params": null