File size: 2,183 Bytes
9c6032b
 
 
5de2d54
0567724
5de2d54
9c6032b
 
 
 
 
 
0567724
9c6032b
 
 
 
 
 
 
0567724
 
 
9c6032b
 
 
 
0567724
9c6032b
 
 
 
0567724
 
 
 
 
 
 
 
9c6032b
d0d7d6c
0567724
d0d7d6c
0567724
d0d7d6c
 
 
 
0567724
d0d7d6c
0567724
d0d7d6c
 
 
0567724
 
 
 
 
 
5de2d54
 
 
 
 
 
 
9c6032b
 
 
0567724
9c6032b
 
0567724
9c6032b
 
 
 
 
 
 
5de2d54
9c6032b
 
 
 
5de2d54
9c6032b
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 0.011927836588638736,
  "eval_steps": 2,
  "global_step": 5,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.0023855673177277472,
      "grad_norm": 1.2481120824813843,
      "learning_rate": 1e-05,
      "loss": 0.9265,
      "step": 1
    },
    {
      "epoch": 0.0023855673177277472,
      "eval_loss": 0.9870346188545227,
      "eval_runtime": 65.0919,
      "eval_samples_per_second": 10.846,
      "eval_steps_per_second": 5.423,
      "step": 1
    },
    {
      "epoch": 0.0047711346354554944,
      "grad_norm": 1.427655577659607,
      "learning_rate": 2e-05,
      "loss": 1.0298,
      "step": 2
    },
    {
      "epoch": 0.0047711346354554944,
      "eval_loss": 0.9387862086296082,
      "eval_runtime": 16.6543,
      "eval_samples_per_second": 42.392,
      "eval_steps_per_second": 21.196,
      "step": 2
    },
    {
      "epoch": 0.007156701953183241,
      "grad_norm": 1.2481718063354492,
      "learning_rate": 3e-05,
      "loss": 0.9639,
      "step": 3
    },
    {
      "epoch": 0.009542269270910989,
      "grad_norm": 1.2510924339294434,
      "learning_rate": 4e-05,
      "loss": 0.9506,
      "step": 4
    },
    {
      "epoch": 0.009542269270910989,
      "eval_loss": 0.8984954953193665,
      "eval_runtime": 16.8324,
      "eval_samples_per_second": 41.943,
      "eval_steps_per_second": 20.971,
      "step": 4
    },
    {
      "epoch": 0.011927836588638736,
      "grad_norm": 1.215053677558899,
      "learning_rate": 5e-05,
      "loss": 0.8298,
      "step": 5
    }
  ],
  "logging_steps": 1,
  "max_steps": 5,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 1,
  "save_steps": 2,
  "stateful_callbacks": {
    "TrainerControl": {
      "args": {
        "should_epoch_stop": false,
        "should_evaluate": false,
        "should_log": false,
        "should_save": true,
        "should_training_stop": true
      },
      "attributes": {}
    }
  },
  "total_flos": 3295645846732800.0,
  "train_batch_size": 2,
  "trial_name": null,
  "trial_params": null
}