Cheng98 committed on
Commit
3ef7528
·
verified ·
1 Parent(s): 4d085c2

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -22,7 +22,7 @@ model-index:
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
- value: 0.7614678899082569
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,8 +32,8 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  This model is a fine-tuned version of [bert-large-cased](https://huggingface.co/bert-large-cased) on the GLUE BOOLQ dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 1.4013
36
- - Accuracy: 0.7615
37
 
38
  ## Model description
39
 
 
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
+ value: 0.7189602446483181
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
32
 
33
  This model is a fine-tuned version of [bert-large-cased](https://huggingface.co/bert-large-cased) on the GLUE BOOLQ dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 1.4813
36
+ - Accuracy: 0.7190
37
 
38
  ## Model description
39
 
all_results.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "epoch": 5.0,
3
- "eval_accuracy": 0.7614678899082569,
4
- "eval_loss": 1.4013047218322754,
5
- "eval_runtime": 18.9743,
6
  "eval_samples": 3270,
7
- "eval_samples_per_second": 172.338,
8
- "eval_steps_per_second": 21.555,
9
- "train_loss": 0.2978504161511437,
10
- "train_runtime": 903.0769,
11
  "train_samples": 9427,
12
- "train_samples_per_second": 52.194,
13
- "train_steps_per_second": 3.267
14
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "eval_accuracy": 0.7189602446483181,
4
+ "eval_loss": 1.4812861680984497,
5
+ "eval_runtime": 8.4911,
6
  "eval_samples": 3270,
7
+ "eval_samples_per_second": 385.11,
8
+ "eval_steps_per_second": 48.168,
9
+ "train_loss": 0.4028913801807468,
10
+ "train_runtime": 280.0096,
11
  "train_samples": 9427,
12
+ "train_samples_per_second": 168.334,
13
+ "train_steps_per_second": 10.535
14
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 5.0,
3
- "eval_accuracy": 0.7614678899082569,
4
- "eval_loss": 1.4013047218322754,
5
- "eval_runtime": 18.9743,
6
  "eval_samples": 3270,
7
- "eval_samples_per_second": 172.338,
8
- "eval_steps_per_second": 21.555
9
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "eval_accuracy": 0.7189602446483181,
4
+ "eval_loss": 1.4812861680984497,
5
+ "eval_runtime": 8.4911,
6
  "eval_samples": 3270,
7
+ "eval_samples_per_second": 385.11,
8
+ "eval_steps_per_second": 48.168
9
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f0ec95a4b3937605fad0b985e01db5f4aa0bb926328fe878000eb9136e2fda27
3
  size 1334459697
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09c8e05d048133b004a7dfacbc2dd0d6788a99fde3c2ceedce26adfc3da5bf7b
3
  size 1334459697
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 5.0,
3
- "train_loss": 0.2978504161511437,
4
- "train_runtime": 903.0769,
5
  "train_samples": 9427,
6
- "train_samples_per_second": 52.194,
7
- "train_steps_per_second": 3.267
8
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "train_loss": 0.4028913801807468,
4
+ "train_runtime": 280.0096,
5
  "train_samples": 9427,
6
+ "train_samples_per_second": 168.334,
7
+ "train_steps_per_second": 10.535
8
  }
trainer_state.json CHANGED
@@ -9,42 +9,42 @@
9
  "log_history": [
10
  {
11
  "epoch": 0.85,
12
- "learning_rate": 1.6610169491525424e-05,
13
- "loss": 0.6459,
14
  "step": 500
15
  },
16
  {
17
  "epoch": 1.69,
18
- "learning_rate": 1.3220338983050848e-05,
19
- "loss": 0.4886,
20
  "step": 1000
21
  },
22
  {
23
  "epoch": 2.54,
24
- "learning_rate": 9.830508474576272e-06,
25
- "loss": 0.292,
26
  "step": 1500
27
  },
28
  {
29
  "epoch": 3.39,
30
- "learning_rate": 6.440677966101695e-06,
31
- "loss": 0.1704,
32
  "step": 2000
33
  },
34
  {
35
  "epoch": 4.24,
36
- "learning_rate": 3.0508474576271192e-06,
37
- "loss": 0.1074,
38
  "step": 2500
39
  },
40
  {
41
  "epoch": 5.0,
42
  "step": 2950,
43
  "total_flos": 1.098164620261632e+16,
44
- "train_loss": 0.2978504161511437,
45
- "train_runtime": 903.0769,
46
- "train_samples_per_second": 52.194,
47
- "train_steps_per_second": 3.267
48
  }
49
  ],
50
  "max_steps": 2950,
 
9
  "log_history": [
10
  {
11
  "epoch": 0.85,
12
+ "learning_rate": 1.663050847457627e-05,
13
+ "loss": 0.6703,
14
  "step": 500
15
  },
16
  {
17
  "epoch": 1.69,
18
+ "learning_rate": 1.3247457627118644e-05,
19
+ "loss": 0.6156,
20
  "step": 1000
21
  },
22
  {
23
  "epoch": 2.54,
24
+ "learning_rate": 9.857627118644068e-06,
25
+ "loss": 0.4724,
26
  "step": 1500
27
  },
28
  {
29
  "epoch": 3.39,
30
+ "learning_rate": 6.4677966101694925e-06,
31
+ "loss": 0.317,
32
  "step": 2000
33
  },
34
  {
35
  "epoch": 4.24,
36
+ "learning_rate": 3.0847457627118648e-06,
37
+ "loss": 0.1946,
38
  "step": 2500
39
  },
40
  {
41
  "epoch": 5.0,
42
  "step": 2950,
43
  "total_flos": 1.098164620261632e+16,
44
+ "train_loss": 0.4028913801807468,
45
+ "train_runtime": 280.0096,
46
+ "train_samples_per_second": 168.334,
47
+ "train_steps_per_second": 10.535
48
  }
49
  ],
50
  "max_steps": 2950,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:533f3a1d23e99ef6bafd35a0187598e54d91a38adf59eea1381eac16b380fe56
3
  size 3963
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cc5a4b111de42d82d2e0312fc3660c44a2822aa287d7173e3e06d983bcc309c
3
  size 3963