File size: 2,183 Bytes
9c6032b 5de2d54 0567724 5de2d54 9c6032b 0567724 9c6032b 0567724 9c6032b 0567724 9c6032b 0567724 9c6032b d0d7d6c 0567724 d0d7d6c 0567724 d0d7d6c 0567724 d0d7d6c 0567724 d0d7d6c 0567724 5de2d54 9c6032b 0567724 9c6032b 0567724 9c6032b 5de2d54 9c6032b 5de2d54 9c6032b |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.011927836588638736,
"eval_steps": 2,
"global_step": 5,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0023855673177277472,
"grad_norm": 1.2481120824813843,
"learning_rate": 1e-05,
"loss": 0.9265,
"step": 1
},
{
"epoch": 0.0023855673177277472,
"eval_loss": 0.9870346188545227,
"eval_runtime": 65.0919,
"eval_samples_per_second": 10.846,
"eval_steps_per_second": 5.423,
"step": 1
},
{
"epoch": 0.0047711346354554944,
"grad_norm": 1.427655577659607,
"learning_rate": 2e-05,
"loss": 1.0298,
"step": 2
},
{
"epoch": 0.0047711346354554944,
"eval_loss": 0.9387862086296082,
"eval_runtime": 16.6543,
"eval_samples_per_second": 42.392,
"eval_steps_per_second": 21.196,
"step": 2
},
{
"epoch": 0.007156701953183241,
"grad_norm": 1.2481718063354492,
"learning_rate": 3e-05,
"loss": 0.9639,
"step": 3
},
{
"epoch": 0.009542269270910989,
"grad_norm": 1.2510924339294434,
"learning_rate": 4e-05,
"loss": 0.9506,
"step": 4
},
{
"epoch": 0.009542269270910989,
"eval_loss": 0.8984954953193665,
"eval_runtime": 16.8324,
"eval_samples_per_second": 41.943,
"eval_steps_per_second": 20.971,
"step": 4
},
{
"epoch": 0.011927836588638736,
"grad_norm": 1.215053677558899,
"learning_rate": 5e-05,
"loss": 0.8298,
"step": 5
}
],
"logging_steps": 1,
"max_steps": 5,
"num_input_tokens_seen": 0,
"num_train_epochs": 1,
"save_steps": 2,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 3295645846732800.0,
"train_batch_size": 2,
"trial_name": null,
"trial_params": null
}
|