lesso02 committed on
Commit
3dd00ba
·
verified ·
1 Parent(s): bd8a413

End of training

Browse files
README.md CHANGED
@@ -103,7 +103,7 @@ xformers_attention: true
103
 
104
  This model is a fine-tuned version of [katuni4ka/tiny-random-olmo-hf](https://huggingface.co/katuni4ka/tiny-random-olmo-hf) on the None dataset.
105
  It achieves the following results on the evaluation set:
106
- - Loss: 10.7643
107
 
108
  ## Model description
109
 
@@ -140,7 +140,7 @@ The following hyperparameters were used during training:
140
 
141
  | Training Loss | Epoch | Step | Validation Loss |
142
  |:-------------:|:------:|:----:|:---------------:|
143
- | 10.7739 | 0.2486 | 200 | 10.7643 |
144
 
145
 
146
  ### Framework versions
 
103
 
104
  This model is a fine-tuned version of [katuni4ka/tiny-random-olmo-hf](https://huggingface.co/katuni4ka/tiny-random-olmo-hf) on the None dataset.
105
  It achieves the following results on the evaluation set:
106
+ - Loss: 10.7765
107
 
108
  ## Model description
109
 
 
140
 
141
  | Training Loss | Epoch | Step | Validation Loss |
142
  |:-------------:|:------:|:----:|:---------------:|
143
+ | 10.7855 | 0.2486 | 200 | 10.7765 |
144
 
145
 
146
  ### Framework versions
adapter_config.json CHANGED
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "o_proj",
24
- "gate_proj",
25
  "v_proj",
 
 
26
  "q_proj",
27
  "k_proj",
28
- "down_proj",
29
- "up_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "down_proj",
 
24
  "v_proj",
25
+ "up_proj",
26
+ "o_proj",
27
  "q_proj",
28
  "k_proj",
29
+ "gate_proj"
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df4eb4790f1cc1f386551822ab48462af5ec8030cc5d38e4d0ec38a6a4c8480c
3
  size 88194
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ef00d28cf40b491e3e26f50f3422d23b3067becbed87ffdaaf79187c1a4af88
3
  size 88194
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3fcce4f8c559d53daa1856dfc12c9ee0d7c7938d995362b7374d124699259ec4
3
  size 81576
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4af7e25e931ca43a953d52e69cb97e18e40333c9b5b417f4649269df6507b9d2
3
  size 81576
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22c13bcd1d2c0e3f1a4e62897f39b48d1e64a2c11f728cb1e66d23224cb9626b
3
  size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:075d98fa3241942aabecd23aaec2ebe0171706d659f62ddb451527855f8e9edf
3
  size 6776