mrferr3t commited on
Commit
2420bcf
·
verified ·
1 Parent(s): a6785df

Training in progress, step 80, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbec2fd4afd82e2174d8e90843450aa9cfec17114609e0daaec109e20feb58b9
3
  size 5752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76a97a1e96f8482415c65bd89a97b0c8bef1f0ba36491dc5c791eb6383fb2c93
3
  size 5752
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bdef43d2b373c43f94b1dfcbd9016d90a7c196769b7519c0951291dc44b8ca91
3
  size 15814
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:154c4e79ae0c1642bec0689b387f356f510f9f2125163f429d2f1e99318872a4
3
  size 15814
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ae59499d6fa89d93656a32994352236f76ecdb3c0d5d7d01bbf5e497aa8ee6c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:642f45901353083874dd4ccdc81e607e878e0b3cdd199252b432047c32c37076
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:066ba65f4953fa1b75b645f57a930b28fbba82ba12586f9907c767ebd5948500
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f80e8870b8e62250be6500873da286447839553cb3b0143c2f041e1ffce40d01
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 11.5,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-20",
4
- "epoch": 0.5687203791469194,
5
  "eval_steps": 20,
6
- "global_step": 60,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -39,6 +39,14 @@
39
  "eval_samples_per_second": 167.381,
40
  "eval_steps_per_second": 5.478,
41
  "step": 60
 
 
 
 
 
 
 
 
42
  }
43
  ],
44
  "logging_steps": 100,
@@ -53,7 +61,7 @@
53
  "early_stopping_threshold": 0.0
54
  },
55
  "attributes": {
56
- "early_stopping_patience_counter": 1
57
  }
58
  },
59
  "TrainerControl": {
@@ -67,7 +75,7 @@
67
  "attributes": {}
68
  }
69
  },
70
- "total_flos": 31876605542400.0,
71
  "train_batch_size": 64,
72
  "trial_name": null,
73
  "trial_params": null
 
1
  {
2
  "best_metric": 11.5,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-20",
4
+ "epoch": 0.7582938388625592,
5
  "eval_steps": 20,
6
+ "global_step": 80,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
39
  "eval_samples_per_second": 167.381,
40
  "eval_steps_per_second": 5.478,
41
  "step": 60
42
+ },
43
+ {
44
+ "epoch": 0.7582938388625592,
45
+ "eval_loss": 11.5,
46
+ "eval_runtime": 1.0634,
47
+ "eval_samples_per_second": 258.61,
48
+ "eval_steps_per_second": 8.464,
49
+ "step": 80
50
  }
51
  ],
52
  "logging_steps": 100,
 
61
  "early_stopping_threshold": 0.0
62
  },
63
  "attributes": {
64
+ "early_stopping_patience_counter": 2
65
  }
66
  },
67
  "TrainerControl": {
 
75
  "attributes": {}
76
  }
77
  },
78
+ "total_flos": 38251926650880.0,
79
  "train_batch_size": 64,
80
  "trial_name": null,
81
  "trial_params": null