upload 1-50
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +84 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
- params_shard_6.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,84 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "gemma2",
|
4 |
+
"quantization": "q4f16_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 3584,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"attention_bias": false,
|
9 |
+
"num_attention_heads": 16,
|
10 |
+
"num_key_value_heads": 8,
|
11 |
+
"head_dim": 256,
|
12 |
+
"num_hidden_layers": 42,
|
13 |
+
"rms_norm_eps": 1e-06,
|
14 |
+
"vocab_size": 256000,
|
15 |
+
"hidden_activation": "gelu_pytorch_tanh",
|
16 |
+
"position_embedding_base": 10000.0,
|
17 |
+
"context_window_size": 4096,
|
18 |
+
"prefill_chunk_size": 4096,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"max_batch_size": 128,
|
21 |
+
"attn_logit_softcapping": 50.0,
|
22 |
+
"final_logit_softcapping": 30.0,
|
23 |
+
"query_pre_attn_scalar": 256,
|
24 |
+
"sliding_window": 4096
|
25 |
+
},
|
26 |
+
"vocab_size": 256000,
|
27 |
+
"context_window_size": 4096,
|
28 |
+
"sliding_window_size": -1,
|
29 |
+
"prefill_chunk_size": 4096,
|
30 |
+
"attention_sink_size": -1,
|
31 |
+
"tensor_parallel_shards": 1,
|
32 |
+
"pipeline_parallel_stages": 1,
|
33 |
+
"temperature": 1.0,
|
34 |
+
"presence_penalty": 0.0,
|
35 |
+
"frequency_penalty": 0.0,
|
36 |
+
"repetition_penalty": 1.0,
|
37 |
+
"top_p": 1.0,
|
38 |
+
"tokenizer_files": [
|
39 |
+
"tokenizer.model",
|
40 |
+
"tokenizer.json",
|
41 |
+
"tokenizer_config.json"
|
42 |
+
],
|
43 |
+
"tokenizer_info": {
|
44 |
+
"token_postproc_method": "byte_fallback",
|
45 |
+
"prepend_space_in_encode": false,
|
46 |
+
"strip_space_in_decode": false
|
47 |
+
},
|
48 |
+
"conv_template": {
|
49 |
+
"name": "gemma_instruction",
|
50 |
+
"system_template": "{system_message}",
|
51 |
+
"system_message": "",
|
52 |
+
"system_prefix_token_ids": [
|
53 |
+
2
|
54 |
+
],
|
55 |
+
"add_role_after_system_message": true,
|
56 |
+
"roles": {
|
57 |
+
"user": "<start_of_turn>user",
|
58 |
+
"assistant": "<start_of_turn>model"
|
59 |
+
},
|
60 |
+
"role_templates": {
|
61 |
+
"user": "{user_message}",
|
62 |
+
"assistant": "{assistant_message}",
|
63 |
+
"tool": "{tool_message}"
|
64 |
+
},
|
65 |
+
"messages": [],
|
66 |
+
"seps": [
|
67 |
+
"<end_of_turn>\n"
|
68 |
+
],
|
69 |
+
"role_content_sep": "\n",
|
70 |
+
"role_empty_sep": "\n",
|
71 |
+
"stop_str": [
|
72 |
+
"<end_of_turn>"
|
73 |
+
],
|
74 |
+
"stop_token_ids": [
|
75 |
+
1,
|
76 |
+
107
|
77 |
+
],
|
78 |
+
"function_string": "",
|
79 |
+
"use_function_calling": false
|
80 |
+
},
|
81 |
+
"pad_token_id": 0,
|
82 |
+
"bos_token_id": 2,
|
83 |
+
"eos_token_id": 8
|
84 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0e6211a1f3cec7694c3f67b288aeac54902949207a1ca41ff8a0ddb37542976
|
3 |
+
size 458752000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbbcce0e575587bdfbc3886a28f59e4250b17a3cb10a1308090bc059456f7b8c
|
3 |
+
size 57344000
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5444844f3ac989e6eee210e416e98e03fb029a60d5fdaf6b819759408bbaf689
|
3 |
+
size 25690112
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42284b63719264f877519b186d02e3c4cb91cd8b3f2ad21df2b41f65b924ce9b
|
3 |
+
size 31223808
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b4600c79b0f8c8df5d24ce0df697fd8f9768d04ced5775119750ebfb2aaf856
|
3 |
+
size 51380224
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c544ec96600d3e71d5cf6d1da8f6e3749ef896898ba9d80406fc01ce55d2bb52
|
3 |
+
size 33510400
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e25d82e23760619ab5d3347e924b4658602ba10f3881dce42ac4fe9ee2159e5a
|
3 |
+
size 51380224
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:972f6271260c9abdb619bcad1092a919af3b0ccfbe268eb4891647051e0fc90f
|
3 |
+
size 29826048
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20808f9fc18faa1fdc8da590071646065dc7b1772b70022d4541c772f65a13e6
|
3 |
+
size 25690112
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d33d1dec81b4460da6e3204663b820169de67b1b390e0d4394a86b5c5e6d9c6
|
3 |
+
size 31223808
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1221955078fa09a4c6d9bf1e9b0cc738279a1b312ee575d4d48512e737ea6453
|
3 |
+
size 51380224
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a9ba84e92e416bfb7283651ce68def7827bada369908cd6b19ded0c02efa288
|
3 |
+
size 33510400
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3b4e85bec5375fb7ccc9c3fe462016a91d262b29b9b3d8be8aa02fd6a232035
|
3 |
+
size 51380224
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfcaeb9be09e15d5ea449e18882018f71c7370cac6c4decc4ff233b81cfc40d1
|
3 |
+
size 51380224
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a48695df82177d7c0f8a77ba6d70aecd7596dd7cb2c034731df3fe1e1c53543
|
3 |
+
size 29826048
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe2b354f781f477ef6e37a8bfe77e827f64b0e8527918895138d78c8c9eb4dad
|
3 |
+
size 51380224
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3729c43cc0c224c6a4d43d6df8c8a88e79c66a1a4aa1c8ed2b97b8addf42a83
|
3 |
+
size 31216640
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:187498a0d7777d45d22d74d9d4e7fbfe483f4fa729e84143a9b61149de5a9766
|
3 |
+
size 25690112
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcaa5ba814d285e6982580e111056a981f03bb4f2fea6e2b4de5983df28a0aaf
|
3 |
+
size 31202304
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b78341cd4084fe4dcd3d4fcf87a6d417f4119335e16625337e57dde53cf6cbe4
|
3 |
+
size 51380224
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8313eeea86bef7286edbf3b0e92f0f08c41abd8bfd45ac97dc72cdfcc63f2e80
|
3 |
+
size 33510400
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b410af5a4ff028ac456e4cf9d91da0bfaf18ca16817f767d0af342c93f23a3b7
|
3 |
+
size 51380224
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:602a1d1307a9ae895937fda304632f9419cb3c5d2bf94fb06053a4eaa787814c
|
3 |
+
size 29826048
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcee150065f57b0cf4d0c34fbafe2fcbc27b9084aee62b7d585ae78261e5baa1
|
3 |
+
size 28908544
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4441c72241f6fad4c2044926cdbff608fb524e2584bbf4d66178b51085435388
|
3 |
+
size 25690112
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76fd68a4579b31f19af939808b6dc1fdf0ec92d3c1ef59080176022305490db0
|
3 |
+
size 31223808
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4a73b0eccfc89cc4652cc18385e224ef04ac08c7f8af76c74db606ea13333b7
|
3 |
+
size 51380224
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7959050222dd1a64f37c8b44d74710272eaab2087ede733aec051799f06fc384
|
3 |
+
size 33510400
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81fb7b1cd8d9fe7c71cfea0e4c3318d4a66d2b2393b19569b9f4e1ad9aa96a7f
|
3 |
+
size 51380224
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da0d59630afe6c020b348b7f9e6af0fb8d87a8b812881aa8f81e9afafe4f5101
|
3 |
+
size 29826048
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c270a4af0c2cc353e6d499909b199577aa5e789194d659fdc1b92e7570a5b388
|
3 |
+
size 25690112
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4cb74198759a34cbebff3c64ebbffbe9ed8a2a3b441731a3c44c695dc9b7939
|
3 |
+
size 31223808
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a8dac87a997f5b55b30cc873df2ac4a92d31411ab89f9dbd55f5e7e53157a3a
|
3 |
+
size 51380224
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77fbb4753a7d47d0b5696261a662397554c553f88bc891741a175e0685976333
|
3 |
+
size 33510400
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bc70485985b972cf6bc8f55cd908d9a19bbf0dc9e6346ea2370ee9b48db8722
|
3 |
+
size 25690112
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e255a4f3a0335ed1751069c35600fc476f7bca029c126aa2350e591cb50d0aa7
|
3 |
+
size 51380224
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e08650c39e6cd8bb7aa7f6dc229554c176cf5dfe7ce68d2d377300f92b9e2bf8
|
3 |
+
size 29826048
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c70967d54d7af00380d808bd95fc188e461e3aeb8fa52a911dd1671e64adf0e2
|
3 |
+
size 25690112
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd6f9dd6796c53554ac16c7023ed2d82c6d3942c05e907cbc8f554f2ff914b96
|
3 |
+
size 31223808
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91ab6f6c814e025534dd6d21f3c803a000f30b0ec364c346b28c42191fff7090
|
3 |
+
size 51380224
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8712b48856c5a0879422221774a7a880a8285e36d758aed0d888b6e91232c8dc
|
3 |
+
size 33510400
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e13732b4d7454f0f50f59c7041ba03cf2432c450d505584df880cb23b8133d5
|
3 |
+
size 51380224
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e75bd30a6f8cbcf572a16324d1d6c85c86ad97a96806672747cb60ab755eedb
|
3 |
+
size 29826048
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cb1a433e369a05ab593be1da82283c592122beb4386c3190276bda8118afdde
|
3 |
+
size 25690112
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c2a6e1a9946549712420127f86da7d7f9fa7c7527c32c1054a2be5e67e157c4
|
3 |
+
size 31223808
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a1dfd6775b73cc38ebde30cf7eaa53d1d2df07f8f1618fe5841196360124211
|
3 |
+
size 31223808
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4bc21841a2905989bf539baca60599abc5fec825626b863330c645304e6eded
|
3 |
+
size 51380224
|
params_shard_6.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e47731f5787cd41ea7fc4b4c2b4b75d5fc68512a73b907c5f095a832c0ec897
|
3 |
+
size 51380224
|