Training in progress, epoch 2, checkpoint
Browse files- checkpoint-204/adapter_config.json +3 -3
- checkpoint-204/adapter_model.safetensors +1 -1
- checkpoint-204/global_step204/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +1 -1
- checkpoint-204/global_step204/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +1 -1
- checkpoint-204/global_step204/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +1 -1
- checkpoint-204/global_step204/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +1 -1
- checkpoint-204/global_step204/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +1 -1
- checkpoint-204/global_step204/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +1 -1
- checkpoint-204/global_step204/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +1 -1
- checkpoint-204/global_step204/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +1 -1
- checkpoint-204/trainer_state.json +3 -3
- checkpoint-204/training_args.bin +1 -1
- checkpoint-204/value_head.safetensors +1 -1
checkpoint-204/adapter_config.json
CHANGED
@@ -20,12 +20,12 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"
|
24 |
"k_proj",
|
25 |
-
"
|
26 |
"o_proj",
|
|
|
27 |
"q_proj",
|
28 |
-
"v_proj",
|
29 |
"gate_proj"
|
30 |
],
|
31 |
"task_type": "CAUSAL_LM",
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
+
"v_proj",
|
24 |
"k_proj",
|
25 |
+
"down_proj",
|
26 |
"o_proj",
|
27 |
+
"up_proj",
|
28 |
"q_proj",
|
|
|
29 |
"gate_proj"
|
30 |
],
|
31 |
"task_type": "CAUSAL_LM",
|
checkpoint-204/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 207244392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7950acbc43ed0e0db3b2c769dcf4f612bad07d3d7165a99f8ce3ba6829396ccd
|
3 |
size 207244392
|
checkpoint-204/global_step204/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 19421232
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6edce4ca7fe812355ca3e4092c6ced42ac99f25c6d6bbcf363356610e6beb35a
|
3 |
size 19421232
|
checkpoint-204/global_step204/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 19421232
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cb70de3fe8006e99b07340989aa3016dd20d6a382ca92c2f29b7031fa575d09
|
3 |
size 19421232
|
checkpoint-204/global_step204/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 19421232
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e14dc81e5dfca2d1d7e4d1afaf131bd0af0be488bb1d560e6d66d55d734dce16
|
3 |
size 19421232
|
checkpoint-204/global_step204/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 19421232
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb1f41c0898618a95f1d01d042daf4df5b5fec8b7f6c4914455a63560aabad0b
|
3 |
size 19421232
|
checkpoint-204/global_step204/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 19421232
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbdb355e0f70485e95d3f883a1ece675972a403b3664a071563d39b84bc68f7a
|
3 |
size 19421232
|
checkpoint-204/global_step204/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 19421232
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d60c8c5bf285033185315740e7bf96d22d72392106ea54184aaf873dc4d6fa71
|
3 |
size 19421232
|
checkpoint-204/global_step204/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 19421232
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1627f6c69c4736bbc7b343bc46d454160e09a134725728417c8bbfbea2a02e7a
|
3 |
size 19421232
|
checkpoint-204/global_step204/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 19421232
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea2f4ef1ef43a43029a1874797cbd244de506cb1e0fde84ec12c41d1c28761b0
|
3 |
size 19421232
|
checkpoint-204/trainer_state.json
CHANGED
@@ -10,16 +10,16 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.9803921568627451,
|
13 |
-
"grad_norm": 0.
|
14 |
"learning_rate": 3.9722621383652286e-05,
|
15 |
"loss": 0.3224,
|
16 |
"step": 100
|
17 |
},
|
18 |
{
|
19 |
"epoch": 1.9607843137254903,
|
20 |
-
"grad_norm": 0.
|
21 |
"learning_rate": 3.816756982694638e-05,
|
22 |
-
"loss": 0.
|
23 |
"step": 200
|
24 |
}
|
25 |
],
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.9803921568627451,
|
13 |
+
"grad_norm": 0.041187554597854614,
|
14 |
"learning_rate": 3.9722621383652286e-05,
|
15 |
"loss": 0.3224,
|
16 |
"step": 100
|
17 |
},
|
18 |
{
|
19 |
"epoch": 1.9607843137254903,
|
20 |
+
"grad_norm": 0.05797708407044411,
|
21 |
"learning_rate": 3.816756982694638e-05,
|
22 |
+
"loss": 0.2134,
|
23 |
"step": 200
|
24 |
}
|
25 |
],
|
checkpoint-204/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 7352
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e85267171c46dc1c3303c31870ee78028f6f93ce2789cc5b73fc96c18746b9e2
|
3 |
size 7352
|
checkpoint-204/value_head.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 16586
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd5ac2d39ad6e5cb6f2926524d26556a10b303be659e2967ae3d930d2ec5b0d4
|
3 |
size 16586
|