Training in progress, step 500
Browse files
- adapter_config.json +8 -15
- adapter_model.safetensors +2 -2
- runs/Jan11_09-59-48_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704934788.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.0 +2 -2
- runs/Jan11_13-19-21_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704946761.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.1 +3 -0
- runs/Jan11_13-20-25_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704946826.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.2 +3 -0
- runs/Jan11_13-28-32_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947312.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.3 +3 -0
- runs/Jan11_13-34-05_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947646.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.4 +3 -0
- runs/Jan11_13-35-03_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947703.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.5 +3 -0
- runs/Jan11_13-36-00_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947760.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1955.0 +3 -0
- runs/Jan11_13-37-48_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947869.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2149.0 +3 -0
- runs/Jan11_13-38-52_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947932.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2358.0 +3 -0
- runs/Jan11_13-41-46_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704948107.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2568.0 +3 -0
- runs/Jan11_13-44-53_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704948294.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2568.1 +3 -0
- training_args.bin +1 -1
adapter_config.json
CHANGED
@@ -1,26 +1,19 @@
|
|
1 |
{
|
2 |
-
"alpha_pattern": {},
|
3 |
"auto_mapping": null,
|
4 |
"base_model_name_or_path": "bert-base-cased",
|
5 |
-
"bias": "all",
|
6 |
"fan_in_fan_out": false,
|
|
|
|
|
|
|
7 |
"inference_mode": true,
|
8 |
-
"init_lora_weights": true,
|
9 |
-
"layers_pattern": null,
|
10 |
-
"layers_to_transform": null,
|
11 |
-
"loftq_config": {},
|
12 |
-
"lora_alpha": 16,
|
13 |
-
"lora_dropout": 0.1,
|
14 |
-
"megatron_config": null,
|
15 |
-
"megatron_core": "megatron.core",
|
16 |
"modules_to_save": null,
|
17 |
-
"peft_type": "LORA",
|
18 |
-
"r": 16,
|
19 |
-
"rank_pattern": {},
|
20 |
"revision": null,
|
21 |
"target_modules": [
|
22 |
-
"query",
|
23 |
-
"value"
|
|
|
24 |
],
|
25 |
"task_type": "QUESTION_ANS"
|
26 |
}
|
|
|
1 |
{
|
|
|
2 |
"auto_mapping": null,
|
3 |
"base_model_name_or_path": "bert-base-cased",
|
|
|
4 |
"fan_in_fan_out": false,
|
5 |
+
"feedforward_modules": [
|
6 |
+
"output.dense"
|
7 |
+
],
|
8 |
"inference_mode": true,
|
9 |
+
"init_ia3_weights": true,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
10 |
"modules_to_save": null,
|
11 |
+
"peft_type": "IA3",
|
|
|
|
|
12 |
"revision": null,
|
13 |
"target_modules": [
|
14 |
+
"key",
|
15 |
+
"value",
|
16 |
+
"output.dense"
|
17 |
],
|
18 |
"task_type": "QUESTION_ANS"
|
19 |
}
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac6a7276c3d71ffe7d902b46bf55d42406c9eded1cc69c35a8fa2273134fc34b
|
3 |
+
size 270552
|
runs/Jan11_09-59-48_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704934788.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b87e578bd8956e50c86cabeecdae0a1d3dd6f9ac21c475a9815cc7a0f3bfdc1
|
3 |
+
size 10553
|
runs/Jan11_13-19-21_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704946761.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9fa68026b467cf86770c837dce71ed54962c2d57fbfdd7dbb860ecad2d2e466
|
3 |
+
size 4336
|
runs/Jan11_13-20-25_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704946826.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3894724e7d1e6f81b80216e9ea7d41b5c96e8f368b070bc0a153f2fcab065516
|
3 |
+
size 4336
|
runs/Jan11_13-28-32_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947312.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5dcd1748ebc9fe6a240163d6f3073bf9a8989bb99cd8d9c2474dbee96199162b
|
3 |
+
size 4451
|
runs/Jan11_13-34-05_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947646.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec37afa3cadd4617afd374fc0c318fdc93b520cda418bfc13e4d24bd3f5322ea
|
3 |
+
size 4451
|
runs/Jan11_13-35-03_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947703.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4f6ae78394d1ef195724ff3f5e05a7509a87233dfa37517f461bbbaa970f490
|
3 |
+
size 4451
|
runs/Jan11_13-36-00_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947760.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1955.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f22f604782250294343a87c28cbf08175caecb01f0b0c4d989ffccfd98cecc89
|
3 |
+
size 4451
|
runs/Jan11_13-37-48_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947869.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2149.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f101e590874dbf4d4f6168929c84cbc423c4d1555d345be6adfdc68528e0b00
|
3 |
+
size 4451
|
runs/Jan11_13-38-52_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947932.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2358.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:844c7bdb93b2323cad9699f35f409d015ae406343a4c30515dd1852c41c669b6
|
3 |
+
size 4336
|
runs/Jan11_13-41-46_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704948107.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2568.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bbc07022defd3ea68538326ad52650956172d055d237346cc402c3eed7bdd27
|
3 |
+
size 4336
|
runs/Jan11_13-44-53_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704948294.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2568.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04e14b80c0a9b714208b195f346d648301623ddb7231d6330f76eb6669ab3968
|
3 |
+
size 4493
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4283
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e766edabd30f1a08758087e8f308ec60ed7ca8908798d6eb95ca8e3d31366ef8
|
3 |
size 4283
|