Upload 150 files
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +76 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_140.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "mistral",
|
4 |
+
"quantization": "q4f16_0",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 5120,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 40,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 131072,
|
12 |
+
"position_embedding_base": 1000000.0,
|
13 |
+
"num_key_value_heads": 8,
|
14 |
+
"head_dim": 128,
|
15 |
+
"context_window_size": 1024000,
|
16 |
+
"sliding_window_size": -1,
|
17 |
+
"prefill_chunk_size": 2048,
|
18 |
+
"attention_sink_size": 4,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"max_batch_size": 80
|
21 |
+
},
|
22 |
+
"vocab_size": 131072,
|
23 |
+
"context_window_size": 1024000,
|
24 |
+
"sliding_window_size": -1,
|
25 |
+
"prefill_chunk_size": 2048,
|
26 |
+
"attention_sink_size": 4,
|
27 |
+
"tensor_parallel_shards": 1,
|
28 |
+
"pipeline_parallel_stages": 1,
|
29 |
+
"temperature": 1.0,
|
30 |
+
"presence_penalty": 0.0,
|
31 |
+
"frequency_penalty": 0.0,
|
32 |
+
"repetition_penalty": 1.0,
|
33 |
+
"top_p": 1.0,
|
34 |
+
"tokenizer_files": [
|
35 |
+
"tokenizer.json",
|
36 |
+
"tokenizer_config.json"
|
37 |
+
],
|
38 |
+
"tokenizer_info": {
|
39 |
+
"token_postproc_method": "byte_level",
|
40 |
+
"prepend_space_in_encode": false,
|
41 |
+
"strip_space_in_decode": false
|
42 |
+
},
|
43 |
+
"conv_template": {
|
44 |
+
"name": "chatml",
|
45 |
+
"system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
|
46 |
+
"system_message": "A conversation between a user and an LLM-based AI assistant. The assistant gives helpful and honest answers.",
|
47 |
+
"system_prefix_token_ids": null,
|
48 |
+
"add_role_after_system_message": true,
|
49 |
+
"roles": {
|
50 |
+
"user": "<|im_start|>user",
|
51 |
+
"assistant": "<|im_start|>assistant"
|
52 |
+
},
|
53 |
+
"role_templates": {
|
54 |
+
"user": "{user_message}",
|
55 |
+
"assistant": "{assistant_message}",
|
56 |
+
"tool": "{tool_message}"
|
57 |
+
},
|
58 |
+
"messages": [],
|
59 |
+
"seps": [
|
60 |
+
"<|im_end|>\n"
|
61 |
+
],
|
62 |
+
"role_content_sep": "\n",
|
63 |
+
"role_empty_sep": "\n",
|
64 |
+
"stop_str": [
|
65 |
+
"<|im_end|>"
|
66 |
+
],
|
67 |
+
"stop_token_ids": [
|
68 |
+
2
|
69 |
+
],
|
70 |
+
"function_string": "",
|
71 |
+
"use_function_calling": false
|
72 |
+
},
|
73 |
+
"pad_token_id": 0,
|
74 |
+
"bos_token_id": 1,
|
75 |
+
"eos_token_id": 4
|
76 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84982e4000775103d809fbf820b5f977a7d63fff076ea4a46ef5bcaf049cdcd9
|
3 |
+
size 335544320
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37d24e9db2499a7cb90d1c132e405d0a04bb4ffd0c57ad746e0544f68bdeb179
|
3 |
+
size 41943040
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d02098bad815a1ea9b65309c17ca358b8440971b30434b05cf023eb350f360c
|
3 |
+
size 31467520
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd5a1b1e35a197f4b3170a753f1354c05d99a7f1f9677f24b7405c57fc14f514
|
3 |
+
size 25579520
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6c6c700088df7a054e821ddaadaeb931ec72f83b5eb74bb925d2a1895f5155e
|
3 |
+
size 36700160
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3da453fc48877691321c8118a376aa63c54de1b51e225b18c68f06afe3502466
|
3 |
+
size 29501440
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1367f937e3b685150f463049ed3870eda2c4b49fb14d5d68279cf55aadb98b24
|
3 |
+
size 73400320
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe3aec2686f63609217593fc8f46ed699a1b1fa5f1c83f62c2ae703cabd9e1a8
|
3 |
+
size 31467520
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2437563a8fc168d56c8881ed89a32cfe9ea705dd930bd397974f703683e42d31
|
3 |
+
size 36700160
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e39e784750b3f45f598e4c50b6ead9f0c72d53cb9a82ae0d46b78612597b1e5
|
3 |
+
size 73400320
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd61cb82df7fd0ffa861b8de1da610117fdaec7a40025f834e7ca00a6de60c2f
|
3 |
+
size 25579520
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4a18b66ea70880a01dfc6bdd1472f1851a1ad69e9ca5ffde22790d950dbbc91
|
3 |
+
size 36700160
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c397af006277b557c26dbc5883aac07e6b4dd4e3a7ac287a9fc0dff5b96dfc2
|
3 |
+
size 29501440
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0fcbe37a107b2797869639efbb2bba57fef1e59faeef3314e6d75a38ae407d1
|
3 |
+
size 36700160
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bd2b6dc98be375073950bbdeb9f277f123f9581a3144ddb9f2f5e3dc93fecd1
|
3 |
+
size 73400320
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b151e9a39d6b34b9a1b98be29a8577baceffb676110b369d65e01f49204cb517
|
3 |
+
size 31467520
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c69c38cb52c42b11759b72a528d8cfd05b541dfd2d485ec9651244f45a5882db
|
3 |
+
size 73400320
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:705856626f7fc52b8ea66aaec6dfb3ce7f6873f1cc1fd583563daf65975d9c5d
|
3 |
+
size 20971520
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a96353f80795168ef97c33c4532fc1a9e187532575828bd22f4c3a732ae5c57
|
3 |
+
size 36700160
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3fc674a40f6e7b5c86f2992bd7d8e99ce82ea634d52d5f3740f020d1b6f051a
|
3 |
+
size 29501440
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5da00508a1c9b286255cb76d393992174d54fa09c4c38c024f777aa26f7cd39a
|
3 |
+
size 36700160
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a347121636dec23c35d329dbb474f9c41da5a7300ad8d8624e1feff8f5476ca
|
3 |
+
size 73400320
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5db7527a0c3220b5e6c95f197539da51c09d02ca26bd5b0facdd7f4b8c0d977c
|
3 |
+
size 18380800
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffe461ba161f624d78091ad296f45e09c46d01108e025a8285e0f912d4bf535d
|
3 |
+
size 36700160
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b10788984545ee6834f72fb4b3b43dc69984149623f1e5d7d0336ca377301dd
|
3 |
+
size 73400320
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1849fb5279e53737f4749f45e91eaa986c4c803a824cd068089f1a77c05ca151
|
3 |
+
size 29501440
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e40755f9dde37d98895ebc5128e2245bc4dc6f90b4836ecb0c71a34be9e24fe9
|
3 |
+
size 73400320
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4d52ec9cddaee7116751e24ccfc61fb898a823ee6984fa8d8237de65039eb62
|
3 |
+
size 31467520
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bf3b6d79ab98abb2a732ad85479ed5f4f791f46ce4a1383d4f6c4af27be4d5c
|
3 |
+
size 36700160
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2f4d8db574b0ae5b9da6081f52738ab07c2e9162a07a64dc005c31a0f81181f
|
3 |
+
size 73400320
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0984c8d02efe9fef4719e85e43fe194799a425068d658aa0332e2cde91588ea3
|
3 |
+
size 25579520
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a5417801ee94f451030dd69aa25b2917c1ef302cc6a7512c126f76d7f38740b
|
3 |
+
size 36700160
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd194113a0782674df1901fff9a91693effc80fe803b0fd8bbc30c4806f6256f
|
3 |
+
size 29501440
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f129b4d0d82346649457141099c2b06319bc2ea9175a78420be665e0cabce9f
|
3 |
+
size 73400320
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e21c45c6b9bedb4808806298f5a421273c633228d8a819ef01c2646cf1293390
|
3 |
+
size 31467520
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3ff23a1686b9f9f3d1f704f56c4f2341dceff9c3082a97a06568e20d7d3ac97
|
3 |
+
size 25579520
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ecafb535674f8bd5cfc3789ed03e00f1effa20f21e869af8b65f8b0c8db8ed0
|
3 |
+
size 36700160
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a06f3fcd6e0e7436496ff86f007ecc43365f7b3bcbcf328302e76e6abd8e55b2
|
3 |
+
size 73400320
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6651214d475f352f2c297d9fc6e085ce44ebbd22de26c7a36861158154dfcf6e
|
3 |
+
size 25579520
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e85034fefbae8767f245d78ee6a6f11a9fa188a558838f9e859abf5273d3e303
|
3 |
+
size 36700160
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bed10862ebb13d4622a2512fd4708bf70232040ace51bf3cb90357566c1a5737
|
3 |
+
size 29501440
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2704f76ae2e56394a1bf155c97443e854473517cef539eeaedb7ea777310c65
|
3 |
+
size 73400320
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9233a428324095946b07eb5bab35f220676b204c091d5d382fb140a5f5c50e1
|
3 |
+
size 31467520
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebd983dfb56a57f42796106622b746e575d8f6213566b7f40380a1d5cdbb6e99
|
3 |
+
size 36700160
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10d646bee23a432a79574fee6a34ac632df70f1548a9595a9279e6a74987710a
|
3 |
+
size 73400320
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d56c54f6d703fb488f6951081004186a2ed84578cf468ec16a0e6f15a4d409d
|
3 |
+
size 25579520
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c42c9ce697e200d95381690078ff015aacec5692c201f98561994d7b0b838ea7
|
3 |
+
size 36700160
|
params_shard_140.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3bc8357e8391f3070ffaabdaa800cbce7a98ca39fb68ee5494a9ec114ba1628a
|
3 |
+
size 36700160
|