update

Files changed (6)

config.json CHANGED Viewed

@@ -25,7 +25,7 @@
   "rope_theta": 100000,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.38.1",
   "use_cache": true,
   "vocab_size": 32256
 }

   "rope_theta": 100000,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
+  "transformers_version": "4.41.0.dev0",
   "use_cache": true,
   "vocab_size": 32256
 }

model-00001-of-00002.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:995a68cf76915b5ad450690e43655ac6fac9e2b1f0c6b96ffc8616f6f3819b25
 size 4971750904

 version https://git-lfs.github.com/spec/v1
+oid sha256:c01f2b54cbc01ee79565279165446a0a470ed66d0d3f892c368aaeffd9018898
 size 4971750904

model-00002-of-00002.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c2bddb316f61128d1bba3c8fdc23b22503fe98e0d2612dc5ce4e55e9350d3313
-size 2235727984

 version https://git-lfs.github.com/spec/v1
+oid sha256:1fab83d3cad51065ab6d1f4874a5e825ee097a777595084c4f879ccab6c2c7ae
+size 2235727976

model.safetensors.index.json CHANGED Viewed

@@ -742,7 +742,7 @@
     "model.layers.9.self_attn.v_proj.qzeros": "model-00001-of-00002.safetensors",
     "model.layers.9.self_attn.v_proj.scales": "model-00001-of-00002.safetensors",
     "model.norm.weight": "model-00002-of-00002.safetensors",
-    "trtllm_bits": "model-00002-of-00002.safetensors",
-    "trtllm_groupsize": "model-00002-of-00002.safetensors"
   }
 }

     "model.layers.9.self_attn.v_proj.qzeros": "model-00001-of-00002.safetensors",
     "model.layers.9.self_attn.v_proj.scales": "model-00001-of-00002.safetensors",
     "model.norm.weight": "model-00002-of-00002.safetensors",
+    "trt_bits": "model-00002-of-00002.safetensors",
+    "trt_groupsize": "model-00002-of-00002.safetensors"
   }
 }

tokenizer.json CHANGED Viewed

@@ -321,6 +321,7 @@
     "end_of_word_suffix": null,
     "fuse_unk": false,
     "byte_fallback": false,
     "vocab": {
       "!": 0,
       "\"": 1,

     "end_of_word_suffix": null,
     "fuse_unk": false,
     "byte_fallback": false,
+    "ignore_merges": false,
     "vocab": {
       "!": 0,
       "\"": 1,

tokenizer_config.json CHANGED Viewed

@@ -183,7 +183,6 @@
   "chat_template": "{% if not add_generation_prompt is defined %}\n{% set add_generation_prompt = false %}\n{% endif %}\n{%- set ns = namespace(found=false) -%}\n{%- for message in messages -%}\n    {%- if message['role'] == 'system' -%}\n        {%- set ns.found = true -%}\n    {%- endif -%}\n{%- endfor -%}\n{{bos_token}}{%- if not ns.found -%}\n{{'You are an AI programming assistant, utilizing the Deepseek Coder model, developed by Deepseek Company, and you only answer questions related to computer science. For politically sensitive questions, security and privacy issues, and other non-computer science questions, you will refuse to answer\\n'}}\n{%- endif %}\n{%- for message in messages %}\n    {%- if message['role'] == 'system' %}\n{{ message['content'] }}\n    {%- else %}\n        {%- if message['role'] == 'user' %}\n{{'### Instruction:\\n' + message['content'] + '\\n'}}\n        {%- else %}\n{{'### Response:\\n' + message['content'] + '\\n<|EOT|>\\n'}}\n        {%- endif %}\n    {%- endif %}\n{%- endfor %}\n{% if add_generation_prompt %}\n{{'### Response:'}}\n{% endif %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|EOT|>",
-  "legacy": true,
   "model_max_length": 16384,
   "pad_token": "<｜end▁of▁sentence｜>",
   "sp_model_kwargs": {},

   "chat_template": "{% if not add_generation_prompt is defined %}\n{% set add_generation_prompt = false %}\n{% endif %}\n{%- set ns = namespace(found=false) -%}\n{%- for message in messages -%}\n    {%- if message['role'] == 'system' -%}\n        {%- set ns.found = true -%}\n    {%- endif -%}\n{%- endfor -%}\n{{bos_token}}{%- if not ns.found -%}\n{{'You are an AI programming assistant, utilizing the Deepseek Coder model, developed by Deepseek Company, and you only answer questions related to computer science. For politically sensitive questions, security and privacy issues, and other non-computer science questions, you will refuse to answer\\n'}}\n{%- endif %}\n{%- for message in messages %}\n    {%- if message['role'] == 'system' %}\n{{ message['content'] }}\n    {%- else %}\n        {%- if message['role'] == 'user' %}\n{{'### Instruction:\\n' + message['content'] + '\\n'}}\n        {%- else %}\n{{'### Response:\\n' + message['content'] + '\\n<|EOT|>\\n'}}\n        {%- endif %}\n    {%- endif %}\n{%- endfor %}\n{% if add_generation_prompt %}\n{{'### Response:'}}\n{% endif %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|EOT|>",
   "model_max_length": 16384,
   "pad_token": "<｜end▁of▁sentence｜>",
   "sp_model_kwargs": {},