Upload folder using huggingface_hub
Browse files- config.json +2 -2
- generation_config.json +1 -1
- model-00001-of-00015.safetensors +1 -1
- model-00002-of-00015.safetensors +1 -1
- model-00003-of-00015.safetensors +1 -1
- model-00004-of-00015.safetensors +1 -1
- model-00005-of-00015.safetensors +1 -1
- model-00006-of-00015.safetensors +1 -1
- model-00007-of-00015.safetensors +1 -1
- model-00008-of-00015.safetensors +1 -1
- model-00009-of-00015.safetensors +1 -1
- model-00010-of-00015.safetensors +1 -1
- model-00011-of-00015.safetensors +1 -1
- model-00012-of-00015.safetensors +1 -1
- model-00013-of-00015.safetensors +1 -1
- model-00014-of-00015.safetensors +1 -1
- model-00015-of-00015.safetensors +1 -1
- recipe.yaml +12 -2
config.json
CHANGED
@@ -47,7 +47,7 @@
|
|
47 |
"quantization_status": "frozen",
|
48 |
"sparsity_config": {
|
49 |
"format": "dense",
|
50 |
-
"global_sparsity": 2.
|
51 |
"registry_requires_subclass": false,
|
52 |
"sparsity_structure": "unstructured"
|
53 |
}
|
@@ -79,7 +79,7 @@
|
|
79 |
"rope_theta": 500000.0,
|
80 |
"tie_word_embeddings": false,
|
81 |
"torch_dtype": "bfloat16",
|
82 |
-
"transformers_version": "4.43.
|
83 |
"use_cache": true,
|
84 |
"vocab_size": 128256
|
85 |
}
|
|
|
47 |
"quantization_status": "frozen",
|
48 |
"sparsity_config": {
|
49 |
"format": "dense",
|
50 |
+
"global_sparsity": 2.0350219291192033,
|
51 |
"registry_requires_subclass": false,
|
52 |
"sparsity_structure": "unstructured"
|
53 |
}
|
|
|
79 |
"rope_theta": 500000.0,
|
80 |
"tie_word_embeddings": false,
|
81 |
"torch_dtype": "bfloat16",
|
82 |
+
"transformers_version": "4.43.3",
|
83 |
"use_cache": true,
|
84 |
"vocab_size": 128256
|
85 |
}
|
generation_config.json
CHANGED
@@ -6,5 +6,5 @@
|
|
6 |
128008,
|
7 |
128009
|
8 |
],
|
9 |
-
"transformers_version": "4.43.
|
10 |
}
|
|
|
6 |
128008,
|
7 |
128009
|
8 |
],
|
9 |
+
"transformers_version": "4.43.3"
|
10 |
}
|
model-00001-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4819900928
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11414693dd88807a2cc34159e92c2f98b0060ad12bbcb853341f740780dd2b5d
|
3 |
size 4819900928
|
model-00002-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4984010360
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ffa38ea00dd7b9337441231c30a840201057dffee3ffb3df7031ecbb2a11c16
|
3 |
size 4984010360
|
model-00003-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4900112536
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bf94685a5adf09a38035e54c2bfbaba872ebec426bb2aa02e76bf5a00f2b9a3
|
3 |
size 4900112536
|
model-00004-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4900104584
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1abde96cfe492fc47303c5d54f7af9d32dc0b80c0814b1934e58f5c280606938
|
3 |
size 4900104584
|
model-00005-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4900104584
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09db1268e643ac958c5d340e7629ea8d2664c22bc5b63f919130642214269d8a
|
3 |
size 4900104584
|
model-00006-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4984010448
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e285e7ab13a54a0d3723cd3e39c7a0ad21f066c425e2123b6e23bfe3c29eca4
|
3 |
size 4984010448
|
model-00007-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4900112552
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45836d673a45a7b336ab9eecf17d6b50264e62d61d15d1161d6edf4152fc35db
|
3 |
size 4900112552
|
model-00008-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4900104584
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb7cb74df9582c752075c28e9de6147c4cff1967585cb2d90e392399af53aa3c
|
3 |
size 4900104584
|
model-00009-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4900104584
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c8d6bc4fe62197d4b933910140420b9b457444d91daa1b609ca0c2dfca7910a
|
3 |
size 4900104584
|
model-00010-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4984010448
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29ca07e2a2084e98a3e7d05b361721ed4d4b71ebf07a5a565d37de69c3f14348
|
3 |
size 4984010448
|
model-00011-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4900112552
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:996d4539fcd59d7bca288c2d64221ba6359b8275ba2d595511a10c105a5b812d
|
3 |
size 4900112552
|
model-00012-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4900104584
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ee5cb9888eb4cfb7685184267e04c971766f79fc4cb5f974bfe70777f10f9fe
|
3 |
size 4900104584
|
model-00013-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4900104584
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e495362d49634554dee2b498f7eca1dcd0c4bb7bf48d6145098f260e203042a
|
3 |
size 4900104584
|
model-00014-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4984010448
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e202bcf3246adf2d3223fa964ff489774a4a36a5fb5df01e32393f0c4e89c94
|
3 |
size 4984010448
|
model-00015-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3813044096
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6774db5aae488ddcd66cff453787a1481198d4a4b85cce3fc12d9e5e8bf5f621
|
3 |
size 3813044096
|
recipe.yaml
CHANGED
@@ -1,8 +1,18 @@
|
|
1 |
quant_stage:
|
2 |
quant_modifiers:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3 |
GPTQModifier:
|
4 |
sequential_update: false
|
5 |
-
dampening_frac: 0.
|
6 |
ignore: [lm_head]
|
7 |
scheme: W8A8
|
8 |
-
targets: Linear
|
|
|
|
1 |
quant_stage:
|
2 |
quant_modifiers:
|
3 |
+
SmoothQuantModifier:
|
4 |
+
smoothing_strength: 0.7
|
5 |
+
mappings:
|
6 |
+
- - ['re:.*q_proj', 're:.*k_proj', 're:.*v_proj']
|
7 |
+
- re:.*input_layernorm
|
8 |
+
- - ['re:.*gate_proj', 're:.*up_proj']
|
9 |
+
- re:.*post_attention_layernorm
|
10 |
+
- - ['re:.*down_proj']
|
11 |
+
- re:.*up_proj
|
12 |
GPTQModifier:
|
13 |
sequential_update: false
|
14 |
+
dampening_frac: 0.2
|
15 |
ignore: [lm_head]
|
16 |
scheme: W8A8
|
17 |
+
targets: [Linear]
|
18 |
+
observer: mse
|