Upload folder using huggingface_hub
Browse files
- .gitattributes +1 -0
- chat_template.jinja +1 -0
- model-00001-of-000017.safetensors +3 -0
- model-00002-of-000017.safetensors +3 -0
- model-00003-of-000017.safetensors +3 -0
- model-00004-of-000017.safetensors +3 -0
- model-00005-of-000017.safetensors +3 -0
- model-00006-of-000017.safetensors +3 -0
- model-00007-of-000017.safetensors +3 -0
- model-00008-of-000017.safetensors +3 -0
- model-00009-of-000017.safetensors +3 -0
- model-00010-of-000017.safetensors +3 -0
- model-00011-of-000017.safetensors +3 -0
- model-00012-of-000017.safetensors +3 -0
- model-00013-of-000017.safetensors +3 -0
- model-00014-of-000017.safetensors +3 -0
- model-00015-of-000017.safetensors +3 -0
- model-00016-of-000017.safetensors +3 -0
- model-00017-of-000017.safetensors +3 -0
- model.safetensors.index.json +0 -0
- tokenizer_config.json +11 -11
.gitattributes
CHANGED
|
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
figures/benchmark.jpg filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
figures/benchmark.jpg filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
chat_template.jinja
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set ns = namespace(is_first=false, is_tool=false, is_output_first=true, system_prompt='') %}{%- for message in messages %}{%- if message['role'] == 'system' %}{% set ns.system_prompt = message['content'] %}{%- endif %}{%- endfor %}{{bos_token}}{{ns.system_prompt}}{%- for message in messages %}{%- if message['role'] == 'user' %}{%- set ns.is_tool = false -%}{{'<|User|>' + message['content']}}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is none %}{%- set ns.is_tool = false -%}{%- for tool in message['tool_calls']%}{%- if not ns.is_first %}{{'<|Assistant|><|tool▁calls▁begin|><|tool▁call▁begin|>' + tool['type'] + '<|tool▁sep|>' + tool['function']['name'] + '\n' + '```json' + '\n' + tool['function']['arguments'] + '\n' + '```' + '<|tool▁call▁end|>'}}{%- set ns.is_first = true -%}{%- else %}{{'\n' + '<|tool▁call▁begin|>' + tool['type'] + '<|tool▁sep|>' + tool['function']['name'] + '\n' + '```json' + '\n' + tool['function']['arguments'] + '\n' + '```' + '<|tool▁call▁end|>'}}{{'<|tool▁calls▁end|><|end▁of▁sentence|>'}}{%- endif %}{%- endfor %}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is not none %}{%- if ns.is_tool %}{{'<|tool▁outputs▁end|>' + message['content'] + '<|end▁of▁sentence|>'}}{%- set ns.is_tool = false -%}{%- else %}{% set content = message['content'] %}{% if '</think>' in content %}{% set content = content.split('</think>')[-1] %}{% endif %}{{'<|Assistant|>' + content + '<|end▁of▁sentence|>'}}{%- endif %}{%- endif %}{%- if message['role'] == 'tool' %}{%- set ns.is_tool = true -%}{%- if ns.is_output_first %}{{'<|tool▁outputs▁begin|><|tool▁output▁begin|>' + message['content'] + '<|tool▁output▁end|>'}}{%- set ns.is_output_first = false %}{%- else %}{{'\n<|tool▁output▁begin|>' + message['content'] + '<|tool▁output▁end|>'}}{%- endif %}{%- endif %}{%- endfor -%}{% if ns.is_tool %}{{'<|tool▁outputs▁end|>'}}{% endif 
%}{% if add_generation_prompt and not ns.is_tool %}{{'<|Assistant|><think>\n'}}{% endif %}
|
model-00001-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4f57a2538539d61f9f22785d3c48f089227829948ee66572808dd13d5b08d63e
|
| 3 |
+
size 8946552810
|
model-00002-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3f948c2df3e4f3e678e1b4c75b345ce646c4843a23e7c9089462cf3995d2af45
|
| 3 |
+
size 8690800055
|
model-00003-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa4b0afa70d26873dabc927e59b7dbc24a0e8eda323d4fdba17927d316d3516c
|
| 3 |
+
size 1577092016
|
model-00004-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:077f51bc9eb56b50868cb95c7cf0d6d0f0a524b824ba3af8b248c78a46593e97
|
| 3 |
+
size 8690767122
|
model-00005-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e826381017b2d8a9d8704be34ee0e0ceeb0a3a9abca27beaa4555d370d5a4f10
|
| 3 |
+
size 8422331428
|
model-00006-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b1d4326d0d4187830fcea956d8ccfafbf6871fa7baed1b759c1ed843cafe92c0
|
| 3 |
+
size 8690767122
|
model-00007-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:62a83ba7af95d532065e46322ae2c17ee020c3c8e92b7285420c09ca0d6f68f0
|
| 3 |
+
size 8422331428
|
model-00008-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8189753d14d5f9b3c31466d1f5a185bb7ffc7fc346cbc06a5453e48e07c2b97b
|
| 3 |
+
size 8690767122
|
model-00009-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:928bea3ae97c3962b3eb3f51a66f674be4cd5858caae541becd3e175f3305403
|
| 3 |
+
size 8422331428
|
model-00010-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1db6d4f8387897b0f40e505310a1542f6d0308370526fa86c42cdc99451d2200
|
| 3 |
+
size 8690767122
|
model-00011-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:31a5eb90d0773f1514ae7b240ed62961412e48f9eb160fdac6226221b87fe61f
|
| 3 |
+
size 8422331428
|
model-00012-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d01c2823a0393ded7f97556995b69965dad78665664853f1c8a2be901e643a44
|
| 3 |
+
size 8690767122
|
model-00013-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3c43532c1b128f0135edc587ace540dfa53759916836960db06b73ab718e5eca
|
| 3 |
+
size 8422331428
|
model-00014-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0f2ce0194b017ae009448602d7fd4ac24d7f25059c0a87d42fc496000f7bdacc
|
| 3 |
+
size 8690767122
|
model-00015-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:572ed974eb237aacf3de9ddfeaa373c62d39038a96ffd7f2beec6ea8f8a7b16e
|
| 3 |
+
size 8422331428
|
model-00016-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5a581377b62f0a918bf515d05f2514281eec031ea2748e7ce8123b910403bba
|
| 3 |
+
size 8690767122
|
model-00017-of-000017.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:605b29e86ec80aaa3a38bb3aab4bc859e4df26928fe49bbca00f127f55897e8d
|
| 3 |
+
size 10523694303
|
model.safetensors.index.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
CHANGED
|
@@ -4,7 +4,7 @@
|
|
| 4 |
"add_prefix_space": null,
|
| 5 |
"added_tokens_decoder": {
|
| 6 |
"128000": {
|
| 7 |
-
"content": "
|
| 8 |
"lstrip": false,
|
| 9 |
"normalized": false,
|
| 10 |
"rstrip": false,
|
|
@@ -12,7 +12,7 @@
|
|
| 12 |
"special": true
|
| 13 |
},
|
| 14 |
"128001": {
|
| 15 |
-
"content": "
|
| 16 |
"lstrip": false,
|
| 17 |
"normalized": false,
|
| 18 |
"rstrip": false,
|
|
@@ -92,7 +92,7 @@
|
|
| 92 |
"special": true
|
| 93 |
},
|
| 94 |
"128011": {
|
| 95 |
-
"content": "
|
| 96 |
"lstrip": false,
|
| 97 |
"normalized": false,
|
| 98 |
"rstrip": false,
|
|
@@ -100,7 +100,7 @@
|
|
| 100 |
"special": false
|
| 101 |
},
|
| 102 |
"128012": {
|
| 103 |
-
"content": "
|
| 104 |
"lstrip": false,
|
| 105 |
"normalized": false,
|
| 106 |
"rstrip": false,
|
|
@@ -124,7 +124,7 @@
|
|
| 124 |
"special": false
|
| 125 |
},
|
| 126 |
"128015": {
|
| 127 |
-
"content": "
|
| 128 |
"lstrip": false,
|
| 129 |
"normalized": false,
|
| 130 |
"rstrip": false,
|
|
@@ -2052,17 +2052,17 @@
|
|
| 2052 |
"special": true
|
| 2053 |
}
|
| 2054 |
},
|
| 2055 |
-
"bos_token": "
|
| 2056 |
-
"chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set ns = namespace(is_first=false, is_tool=false, is_output_first=true, system_prompt='') %}{%- for message in messages %}{%- if message['role'] == 'system' %}{% set ns.system_prompt = message['content'] %}{%- endif %}{%- endfor %}{{bos_token}}{{ns.system_prompt}}{%- for message in messages %}{%- if message['role'] == 'user' %}{%- set ns.is_tool = false -%}{{'<|User|>' + message['content']}}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is none %}{%- set ns.is_tool = false -%}{%- for tool in message['tool_calls']%}{%- if not ns.is_first %}{{'<|Assistant|><|tool▁calls▁begin|><|tool▁call▁begin|>' + tool['type'] + '<|tool▁sep|>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + tool['function']['arguments'] + '\\n' + '```' + '<|tool▁call▁end|>'}}{%- set ns.is_first = true -%}{%- else %}{{'\\n' + '<|tool▁call▁begin|>' + tool['type'] + '<|tool▁sep|>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + tool['function']['arguments'] + '\\n' + '```' + '<|tool▁call▁end|>'}}{{'<|tool▁calls▁end|><|end▁of▁sentence|>'}}{%- endif %}{%- endfor %}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is not none %}{%- if ns.is_tool %}{{'<|tool▁outputs▁end|>' + message['content'] + '<|end▁of▁sentence|>'}}{%- set ns.is_tool = false -%}{%- else %}{% set content = message['content'] %}{% if '</think>' in content %}{% set content = content.split('</think>')[-1] %}{% endif %}{{'<|Assistant|>' + content + '<|end▁of▁sentence|>'}}{%- endif %}{%- endif %}{%- if message['role'] == 'tool' %}{%- set ns.is_tool = true -%}{%- if ns.is_output_first %}{{'<|tool▁outputs▁begin|><|tool▁output▁begin|>' + message['content'] + '<|tool▁output▁end|>'}}{%- set ns.is_output_first = false %}{%- else %}{{'\\n<|tool▁output▁begin|>' + message['content'] + '<|tool▁output▁end|>'}}{%- endif %}{%- endif %}{%- endfor -%}{% if ns.is_tool 
%}{{'<|tool▁outputs▁end|>'}}{% endif %}{% if add_generation_prompt and not ns.is_tool %}{{'<|Assistant|><think>\\n'}}{% endif %}",
|
| 2057 |
"clean_up_tokenization_spaces": false,
|
| 2058 |
-
"eos_token": "
|
| 2059 |
"extra_special_tokens": {},
|
| 2060 |
"legacy": true,
|
| 2061 |
-
"model_max_length":
|
| 2062 |
"pad_token": "<|finetune_right_pad_id|>",
|
| 2063 |
"padding_side": "left",
|
| 2064 |
"sp_model_kwargs": {},
|
| 2065 |
"tokenizer_class": "LlamaTokenizerFast",
|
| 2066 |
"unk_token": null,
|
| 2067 |
-
"use_default_system_prompt": false
|
| 2068 |
-
}
|
|
|
|
|
|
| 4 |
"add_prefix_space": null,
|
| 5 |
"added_tokens_decoder": {
|
| 6 |
"128000": {
|
| 7 |
+
"content": "<\uff5cbegin\u2581of\u2581sentence\uff5c>",
|
| 8 |
"lstrip": false,
|
| 9 |
"normalized": false,
|
| 10 |
"rstrip": false,
|
|
|
|
| 12 |
"special": true
|
| 13 |
},
|
| 14 |
"128001": {
|
| 15 |
+
"content": "<\uff5cend\u2581of\u2581sentence\uff5c>",
|
| 16 |
"lstrip": false,
|
| 17 |
"normalized": false,
|
| 18 |
"rstrip": false,
|
|
|
|
| 92 |
"special": true
|
| 93 |
},
|
| 94 |
"128011": {
|
| 95 |
+
"content": "<\uff5cUser\uff5c>",
|
| 96 |
"lstrip": false,
|
| 97 |
"normalized": false,
|
| 98 |
"rstrip": false,
|
|
|
|
| 100 |
"special": false
|
| 101 |
},
|
| 102 |
"128012": {
|
| 103 |
+
"content": "<\uff5cAssistant\uff5c>",
|
| 104 |
"lstrip": false,
|
| 105 |
"normalized": false,
|
| 106 |
"rstrip": false,
|
|
|
|
| 124 |
"special": false
|
| 125 |
},
|
| 126 |
"128015": {
|
| 127 |
+
"content": "<\uff5c\u2581pad\u2581\uff5c>",
|
| 128 |
"lstrip": false,
|
| 129 |
"normalized": false,
|
| 130 |
"rstrip": false,
|
|
|
|
| 2052 |
"special": true
|
| 2053 |
}
|
| 2054 |
},
|
| 2055 |
+
"bos_token": "<\uff5cbegin\u2581of\u2581sentence\uff5c>",
|
|
|
|
| 2056 |
"clean_up_tokenization_spaces": false,
|
| 2057 |
+
"eos_token": "<\uff5cend\u2581of\u2581sentence\uff5c>",
|
| 2058 |
"extra_special_tokens": {},
|
| 2059 |
"legacy": true,
|
| 2060 |
+
"model_max_length": 16384,
|
| 2061 |
"pad_token": "<|finetune_right_pad_id|>",
|
| 2062 |
"padding_side": "left",
|
| 2063 |
"sp_model_kwargs": {},
|
| 2064 |
"tokenizer_class": "LlamaTokenizerFast",
|
| 2065 |
"unk_token": null,
|
| 2066 |
+
"use_default_system_prompt": false,
|
| 2067 |
+
"chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set ns = namespace(is_first=false, is_tool=false, is_output_first=true, system_prompt='') %}{%- for message in messages %}{%- if message['role'] == 'system' %}{% set ns.system_prompt = message['content'] %}{%- endif %}{%- endfor %}{{bos_token}}{{ns.system_prompt}}{%- for message in messages %}{%- if message['role'] == 'user' %}{%- set ns.is_tool = false -%}{{'<\uff5cUser\uff5c>' + message['content']}}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is none %}{%- set ns.is_tool = false -%}{%- for tool in message['tool_calls']%}{%- if not ns.is_first %}{{'<\uff5cAssistant\uff5c><\uff5ctool\u2581calls\u2581begin\uff5c><\uff5ctool\u2581call\u2581begin\uff5c>' + tool['type'] + '<\uff5ctool\u2581sep\uff5c>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + tool['function']['arguments'] + '\\n' + '```' + '<\uff5ctool\u2581call\u2581end\uff5c>'}}{%- set ns.is_first = true -%}{%- else %}{{'\\n' + '<\uff5ctool\u2581call\u2581begin\uff5c>' + tool['type'] + '<\uff5ctool\u2581sep\uff5c>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + tool['function']['arguments'] + '\\n' + '```' + '<\uff5ctool\u2581call\u2581end\uff5c>'}}{{'<\uff5ctool\u2581calls\u2581end\uff5c><\uff5cend\u2581of\u2581sentence\uff5c>'}}{%- endif %}{%- endfor %}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is not none %}{%- if ns.is_tool %}{{'<\uff5ctool\u2581outputs\u2581end\uff5c>' + message['content'] + '<\uff5cend\u2581of\u2581sentence\uff5c>'}}{%- set ns.is_tool = false -%}{%- else %}{% set content = message['content'] %}{% if '</think>' in content %}{% set content = content.split('</think>')[-1] %}{% endif %}{{'<\uff5cAssistant\uff5c>' + content + '<\uff5cend\u2581of\u2581sentence\uff5c>'}}{%- endif %}{%- endif %}{%- if message['role'] == 'tool' %}{%- set ns.is_tool = true -%}{%- if ns.is_output_first 
%}{{'<\uff5ctool\u2581outputs\u2581begin\uff5c><\uff5ctool\u2581output\u2581begin\uff5c>' + message['content'] + '<\uff5ctool\u2581output\u2581end\uff5c>'}}{%- set ns.is_output_first = false %}{%- else %}{{'\\n<\uff5ctool\u2581output\u2581begin\uff5c>' + message['content'] + '<\uff5ctool\u2581output\u2581end\uff5c>'}}{%- endif %}{%- endif %}{%- endfor -%}{% if ns.is_tool %}{{'<\uff5ctool\u2581outputs\u2581end\uff5c>'}}{% endif %}{% if add_generation_prompt and not ns.is_tool %}{{'<\uff5cAssistant\uff5c><think>\\n'}}{% endif %}"
|
| 2068 |
+
}
|