Upload 152 files
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- merges.txt +0 -0
- mlc-chat-config.json +78 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "mistral",
|
4 |
+
"quantization": "q4f16_0",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 5120,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 40,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 131072,
|
12 |
+
"position_embedding_base": 1000000.0,
|
13 |
+
"num_key_value_heads": 8,
|
14 |
+
"head_dim": 128,
|
15 |
+
"context_window_size": 1024000,
|
16 |
+
"sliding_window_size": -1,
|
17 |
+
"prefill_chunk_size": 2048,
|
18 |
+
"attention_sink_size": 4,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"max_batch_size": 80
|
21 |
+
},
|
22 |
+
"vocab_size": 131072,
|
23 |
+
"context_window_size": 1024000,
|
24 |
+
"sliding_window_size": -1,
|
25 |
+
"prefill_chunk_size": 2048,
|
26 |
+
"attention_sink_size": 4,
|
27 |
+
"tensor_parallel_shards": 1,
|
28 |
+
"pipeline_parallel_stages": 1,
|
29 |
+
"temperature": 1.0,
|
30 |
+
"presence_penalty": 0.0,
|
31 |
+
"frequency_penalty": 0.0,
|
32 |
+
"repetition_penalty": 1.0,
|
33 |
+
"top_p": 1.0,
|
34 |
+
"tokenizer_files": [
|
35 |
+
"tokenizer.json",
|
36 |
+
"vocab.json",
|
37 |
+
"merges.txt",
|
38 |
+
"tokenizer_config.json"
|
39 |
+
],
|
40 |
+
"tokenizer_info": {
|
41 |
+
"token_postproc_method": "byte_level",
|
42 |
+
"prepend_space_in_encode": false,
|
43 |
+
"strip_space_in_decode": false
|
44 |
+
},
|
45 |
+
"conv_template": {
|
46 |
+
"name": "chatml",
|
47 |
+
"system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
|
48 |
+
"system_message": "A conversation between a user and an LLM-based AI assistant. The assistant gives helpful and honest answers.",
|
49 |
+
"system_prefix_token_ids": null,
|
50 |
+
"add_role_after_system_message": true,
|
51 |
+
"roles": {
|
52 |
+
"user": "<|im_start|>user",
|
53 |
+
"assistant": "<|im_start|>assistant"
|
54 |
+
},
|
55 |
+
"role_templates": {
|
56 |
+
"user": "{user_message}",
|
57 |
+
"assistant": "{assistant_message}",
|
58 |
+
"tool": "{tool_message}"
|
59 |
+
},
|
60 |
+
"messages": [],
|
61 |
+
"seps": [
|
62 |
+
"<|im_end|>\n"
|
63 |
+
],
|
64 |
+
"role_content_sep": "\n",
|
65 |
+
"role_empty_sep": "\n",
|
66 |
+
"stop_str": [
|
67 |
+
"<|im_end|>"
|
68 |
+
],
|
69 |
+
"stop_token_ids": [
|
70 |
+
2
|
71 |
+
],
|
72 |
+
"function_string": "",
|
73 |
+
"use_function_calling": false
|
74 |
+
},
|
75 |
+
"pad_token_id": 0,
|
76 |
+
"bos_token_id": 1,
|
77 |
+
"eos_token_id": 2
|
78 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a8330d0ee37209a494eb30793dc8dfcef84dfd27de5a0b499f308bc3f37f538
|
3 |
+
size 335544320
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46f809b461ebc23a694dcbbdcc88445f6b89e0d810e7d5a9a49f9ed71220c719
|
3 |
+
size 41943040
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae3cd6efb8fcd3710744a1f850f46fba46bdf866ee0d460e4def141185a785a0
|
3 |
+
size 31467520
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42cca3aad8df60291ed5a0abfc5cd7e934f4887cf330b827bceccd39f49b3bb6
|
3 |
+
size 25579520
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f5257d69903087ba8f5bb2c86271c608fed8d6c746897b1da7cdb961b464e32
|
3 |
+
size 36700160
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba5c54634e7cb81aaee0e01f8359e454875684bf180955709e7d4611e65f0324
|
3 |
+
size 29501440
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2c71af75dbcd2eb66a137c40434094485f38e6fee56436cfc2a73d3eb1d3c9c
|
3 |
+
size 73400320
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6159bfd5c9a6dbed670d43d402e040894907a23e375d249edfb9a2d3986f7dd3
|
3 |
+
size 31467520
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8ef40fd172228e7c9fbee38fca017ccabd3b11af3505f2f6f7450fd31de489a
|
3 |
+
size 36700160
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eae29d9aefd8406c0e45989bcef0d4ce03bf718de164851fc815409bc53dcc86
|
3 |
+
size 73400320
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cf00c9710d9163c935b0f4c67cda4c6b1fc69f71f1283e7c9d6d892c53e9d71
|
3 |
+
size 25579520
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c5e34cba7ec4151035b16c2e7aa269d2ffd99e5330dae2ad8dfe9d8ba8fec1e
|
3 |
+
size 36700160
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83a84e1c661d9ca26915e55303f21a79a286cb2b38e8f80366b73fbc45faf1e9
|
3 |
+
size 29501440
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:756218ea7ad0f24204253c7746bc2434f9e9308587bd149a39a3a58be6fe7fba
|
3 |
+
size 36700160
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79e579d80f3a544260bec90380aab7029b773768fed8bb8384a4e35e6a4289ff
|
3 |
+
size 73400320
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acae1a91f35aa4fd64b7aab0cf778951401ecc0736b7cc4c584ef7ec557e702d
|
3 |
+
size 31467520
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1fa6faa0e0b06cf55e4be26d210e548fdce6521d617daa392b3f2c3704f0ad5a
|
3 |
+
size 73400320
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d25f12b4e7637f7f6dec461ed5540a82f083fa690087ccdf004fd2deb5fa89e4
|
3 |
+
size 20971520
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd7f5bdf461ef243910f979529a8f656d5d44ccf33cfb1b1cb8a4f291497f3e4
|
3 |
+
size 36700160
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2411399dfb230cedc5f62a17c120d9fd009f07ee50bae679ec41ff0107a6eec7
|
3 |
+
size 29501440
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c1a2f6e50619e2b81b25321e188fbba04156249b26ece5782a66abc9c578f2c
|
3 |
+
size 36700160
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f94f78fc9144f4eb33665af73cf1875d9b85272a7f8feb2e2d8cc6675fef4c5
|
3 |
+
size 73400320
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccd57c033da9359505dd32b88b0e3745c62d466f206a941149b62409c24f6cea
|
3 |
+
size 18380800
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f0d52c41ef7d52593252919093ea91e6073445d848b21e447eab8e89fd15d82
|
3 |
+
size 36700160
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08f10bf7fb8bd0764ef69752ce69baef7bcf939979fd72fbe095669df8728bc7
|
3 |
+
size 73400320
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ee445d1aeaebe720ddedb3a078e4c6f70f086bd5437756b1cc59ee2648049aa
|
3 |
+
size 29501440
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44ea5461b674af66784cd08dfde52a09c5878e0eb12983551c9a3c9677daabf1
|
3 |
+
size 73400320
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5cb6674d409875f004c602a388d9581e1a529b81c437cf0f931b5b83005c5a9d
|
3 |
+
size 31467520
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f00cfc391a01f2f9f73d9db762eee74424bf528d413fed682a37e88ab54a675
|
3 |
+
size 36700160
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aab275a27a55f1bb05746b01b9c50e567c55e59a53ac56bfc7fe8133e22daadf
|
3 |
+
size 73400320
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa9fd41e96cdbf974fc0184b0e6927db08d67ed1c783d2f3b3add76f97cc8e7d
|
3 |
+
size 25579520
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee8347a46014290caa3752e6e1d31c54a4317fb783a7fc1da8dc4bfe8df650f2
|
3 |
+
size 36700160
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9475325819f5cfb408749267a71df765a9993c2067d55d7c531d41ac04df8fe7
|
3 |
+
size 29501440
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42391ba9f031b634afc3c83299225ac3d927e962fe6b852d659223f7ee1293c7
|
3 |
+
size 73400320
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61d4aa7074054d3d0b152a1f6dea3be6feca6a327ccdc275f9894da022685e95
|
3 |
+
size 31467520
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa35f6549cc634ae950000f5bab5f4d247ffd812e131f6d35dbc0b53837462cd
|
3 |
+
size 25579520
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:449756dcaba2feb51904980879d250a8d1b0356984cbb7ca26aa7e6ffcde4fa7
|
3 |
+
size 36700160
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6f711b4c0f82ff5f49e95154607b9a304557743d79532e9658a4b1db33d3e58
|
3 |
+
size 73400320
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0835f8ded49d08a4e0a428d2c0a26e4aa51e0ee936d584e6f7421c2f51c6254e
|
3 |
+
size 25579520
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d252ae22993727341af7fffffe10528a5988102f68ef066573352613a2306bb8
|
3 |
+
size 36700160
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee8527910020728f22bafdea38d13a6a20dca77332c616517fad2034d91559ca
|
3 |
+
size 29501440
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f8440e5638a8cef2a3c8a10a4f0f47365077f8f6d3a6b191e44b77b0c7751a5
|
3 |
+
size 73400320
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec01698fd4f599034e7f2d5e64ac902bd08446d2b8dfdf7196778751f3240d24
|
3 |
+
size 31467520
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce76519eaf0817fe73d781f9d1fb5f7010f148c30d90ee68e92a322eb4e808e7
|
3 |
+
size 36700160
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7df6f79966e8646771e36c9bfad910bac99d085bfe76e8a4085c65d8db9fc32e
|
3 |
+
size 73400320
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc0ff37cb6596868cf714d0194d3d7023be074cc2bd9378442d94d644506d3b2
|
3 |
+
size 25579520
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac9457552443c98c196a1f359999b5e56d282918df1f208c4662a7372eab7ae7
|
3 |
+
size 36700160
|