Upload 150 files
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +76 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_140.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "mistral",
|
4 |
+
"quantization": "q4f16_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 5120,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 40,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 131072,
|
12 |
+
"position_embedding_base": 1000000.0,
|
13 |
+
"num_key_value_heads": 8,
|
14 |
+
"head_dim": 128,
|
15 |
+
"context_window_size": 1024000,
|
16 |
+
"sliding_window_size": -1,
|
17 |
+
"prefill_chunk_size": 2048,
|
18 |
+
"attention_sink_size": 4,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"max_batch_size": 80
|
21 |
+
},
|
22 |
+
"vocab_size": 131072,
|
23 |
+
"context_window_size": 1024000,
|
24 |
+
"sliding_window_size": -1,
|
25 |
+
"prefill_chunk_size": 2048,
|
26 |
+
"attention_sink_size": 4,
|
27 |
+
"tensor_parallel_shards": 1,
|
28 |
+
"pipeline_parallel_stages": 1,
|
29 |
+
"temperature": 1.0,
|
30 |
+
"presence_penalty": 0.0,
|
31 |
+
"frequency_penalty": 0.0,
|
32 |
+
"repetition_penalty": 1.0,
|
33 |
+
"top_p": 1.0,
|
34 |
+
"tokenizer_files": [
|
35 |
+
"tokenizer.json",
|
36 |
+
"tokenizer_config.json"
|
37 |
+
],
|
38 |
+
"tokenizer_info": {
|
39 |
+
"token_postproc_method": "byte_level",
|
40 |
+
"prepend_space_in_encode": false,
|
41 |
+
"strip_space_in_decode": false
|
42 |
+
},
|
43 |
+
"conv_template": {
|
44 |
+
"name": "chatml",
|
45 |
+
"system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
|
46 |
+
"system_message": "A conversation between a user and an LLM-based AI assistant. The assistant gives helpful and honest answers.",
|
47 |
+
"system_prefix_token_ids": null,
|
48 |
+
"add_role_after_system_message": true,
|
49 |
+
"roles": {
|
50 |
+
"user": "<|im_start|>user",
|
51 |
+
"assistant": "<|im_start|>assistant"
|
52 |
+
},
|
53 |
+
"role_templates": {
|
54 |
+
"user": "{user_message}",
|
55 |
+
"assistant": "{assistant_message}",
|
56 |
+
"tool": "{tool_message}"
|
57 |
+
},
|
58 |
+
"messages": [],
|
59 |
+
"seps": [
|
60 |
+
"<|im_end|>\n"
|
61 |
+
],
|
62 |
+
"role_content_sep": "\n",
|
63 |
+
"role_empty_sep": "\n",
|
64 |
+
"stop_str": [
|
65 |
+
"<|im_end|>"
|
66 |
+
],
|
67 |
+
"stop_token_ids": [
|
68 |
+
2
|
69 |
+
],
|
70 |
+
"function_string": "",
|
71 |
+
"use_function_calling": false
|
72 |
+
},
|
73 |
+
"pad_token_id": 0,
|
74 |
+
"bos_token_id": 1,
|
75 |
+
"eos_token_id": 4
|
76 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3661e5d3b89630b4f2cc1a718358dc601f07cf9e0179c74bc4eee2bc6bfecee7
|
3 |
+
size 335544320
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:772cd5cb80f0291f468611a72401ee4a660642aa7061f5633a79d163e24f4552
|
3 |
+
size 41943040
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cdb8090d9671c6a41ce7e98ee08ec12927c90e213d91742f4601573d635e7a7
|
3 |
+
size 31467520
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59d7c76d4e557cbdcdd30c856d7a065ed3f59c3f9f59a13e124652ba30fb3d6a
|
3 |
+
size 25579520
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de3855498e99473bcb46f0156cd67967bfee767fa6f5cdf3d9828db9f0ef30a8
|
3 |
+
size 36700160
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b3fac5f5deb44479850bd6238d479b2edb596a264d555de94046b2fb32b89c6
|
3 |
+
size 29501440
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8bb92dba4d259dddaa2caa58f3416961af2bff3bdb8855c19b4450c4760af2f6
|
3 |
+
size 73400320
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c12e4c1d46eaeaa8228cab53e94b8ecd92345967f2e3e2afd4a61a5fba8979c
|
3 |
+
size 31467520
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b20a73dc0694487602f6a8bd859eccd17d7b1f761fdcd7f3d8b97b1921fd858b
|
3 |
+
size 36700160
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c49e2c37fe39d44da60e744f5108be30b0f1685843bba03a720e14962f32787
|
3 |
+
size 73400320
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fc2e856d750a53dd1e73f58163139fc45039badc41169e9ca49ce880e44656c
|
3 |
+
size 25579520
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6b9ec7330e23b0f46788fa71daab07d41f2eee72f2179f6e74a04ab124289e1
|
3 |
+
size 36700160
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1d8e352072aa913a2d7500fcbb4ca51a0e046d9c31a9925eea0391d5e5e6f1d
|
3 |
+
size 29501440
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52f84b665bf0c798de5d91fb7a98816f6ee1cec86515d0f41e46812fbe72c763
|
3 |
+
size 36700160
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5703f0a68f822a87f9cca4aa5fac00d0d916330ef05d4f2169d32c9b6b9e1099
|
3 |
+
size 73400320
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77442da9d6488d110d09b8bfb11904b091def28f3787724a2f798aaf9b694396
|
3 |
+
size 31467520
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ef50cee3c804b3e430ea40efcab7a3023604b59722854439b66acead73791e0
|
3 |
+
size 73400320
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee4add7cd4eaa1b7ec71a6e906757eba405c7358318638a4e143e6bb3d3547c1
|
3 |
+
size 20971520
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff1155467eadd956a2266277ce8580a4bd1b20b435722b8d02e453b1886638dd
|
3 |
+
size 36700160
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79add91f9723f2859e5ef0f5ea70bbd6ad5dc783ec9f43324289ecf3eea617b9
|
3 |
+
size 29501440
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b0b754423f7f2b49f9928089f5f6341e099ac9e51e735607b3cfe13cc6524fc
|
3 |
+
size 36700160
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52900c2bafd0a12de7621d62293715da7bb1a4843f4781a73ca87e75f25d1c94
|
3 |
+
size 73400320
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:955ff291623a557438fcdfb894a87d78b62536abb9ef1a9d3e7bc15593c7ce84
|
3 |
+
size 18380800
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:854c07e81df6fd72e31c14e82d6e9e4943237cc1d9a8e46d61a41697b4c45591
|
3 |
+
size 36700160
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36de2727a785cda75cdab239a037fe7f1b053e614639c28dbaf796aabac93bfd
|
3 |
+
size 73400320
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30fe19955397084c3af3acc53a2e3a1f467e89dcc0e7bf46d55ed7fa5fcbf36a
|
3 |
+
size 29501440
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4012b505c36b8e9d704381caef0d890714f6eb7fbe81608d681979b38acbce4
|
3 |
+
size 73400320
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bbc38294e76e4fe0548208364c1e65686257fc775f80c76c43d1a3a46af9267
|
3 |
+
size 31467520
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd7c6a9b0b8a52209b1806f2f416d1e2a04f48e6090f622911811fa6879ce997
|
3 |
+
size 36700160
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10f784443a4708e4ba31225c6e9b7f99be6127fff4d318dc9be0f0d015d2654a
|
3 |
+
size 73400320
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d4cf1d002e43e28f0b1ae7b2d22a972af65c4577300d35144ed62168287b366
|
3 |
+
size 25579520
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4718cb1ba4d280a41cd3d0884d8a28e9c5864335371bbc6fc7c6e0c3884e664b
|
3 |
+
size 36700160
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a58e6e7fda97c47554959318773aa2de4d302d99fb98d0cfd01cc3882cad3a3
|
3 |
+
size 29501440
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:433f13db6ae47fea87bd7f02fee1e413340225a1c1e55571d2e7797cb9389eff
|
3 |
+
size 73400320
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd1fc12b729af2d48f9cb07cb86d9258740b2ec549c7917ee2be718b4b5f2949
|
3 |
+
size 31467520
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:791c2bb0e340f873388ae10e13086d089e279b1eebda42bf66e6b897dfcf6b0f
|
3 |
+
size 25579520
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8dfc60bfd8111f9d06911ccb00e94a6e601f926d13b741ac108527f6119e4ea0
|
3 |
+
size 36700160
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77e646fc4f6c7788dfeafd387fec019cfc3bcd2e7e499c3a35bd5df2016fb64d
|
3 |
+
size 73400320
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6349747debdd9cef3ce5d613d8ede9d1c5c5d2f05ff2f25b7030585e4b68be84
|
3 |
+
size 25579520
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a164dbdfe07474ac09cd33061f7e86366dad3092b7871ed0eb0ef0507abfcea6
|
3 |
+
size 36700160
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:604e46fefd3c8bb1d2d840718f3e8d3c7a105bbca996a0d1f1b026ef9d1b8bcf
|
3 |
+
size 29501440
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8708dc34c92203229c0c51fa171e66b34a0f9981bcb95b011a86a2d03e6763e0
|
3 |
+
size 73400320
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4be04cf2bc25d7b89156ba088b43a075926ffbac0182e76fa967aabd5e2bdd5b
|
3 |
+
size 31467520
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96408b161665861cf7f491735b73d540fd22a2ce39292a33146e4afede694fac
|
3 |
+
size 36700160
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c1f4be0adee00d32e8c3ba7fbb894cd93dc19ab2b28b9d09a7f4db778a6216d
|
3 |
+
size 73400320
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2be3c43362ab256a0d174ed4636c7295bd0e7753a074808631c7a7e876dc863
|
3 |
+
size 25579520
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61f3666fed6c59d4fa70fb63859daf30ad9a86f9a0b95374b17e5f4f87c4d4f5
|
3 |
+
size 36700160
|
params_shard_140.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5894ca1831c55ca27bbfda7a36561ee7b6dc3efd4c7f13777aa73a0ae53430e
|
3 |
+
size 36700160
|