awni committed on
Commit
10f31ed
·
verified ·
1 Parent(s): 989e512

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. README.md +33 -0
  2. config.json +69 -0
  3. model-00001-of-00070.safetensors +3 -0
  4. model-00002-of-00070.safetensors +3 -0
  5. model-00003-of-00070.safetensors +3 -0
  6. model-00004-of-00070.safetensors +3 -0
  7. model-00005-of-00070.safetensors +3 -0
  8. model-00006-of-00070.safetensors +3 -0
  9. model-00007-of-00070.safetensors +3 -0
  10. model-00008-of-00070.safetensors +3 -0
  11. model-00009-of-00070.safetensors +3 -0
  12. model-00010-of-00070.safetensors +3 -0
  13. model-00011-of-00070.safetensors +3 -0
  14. model-00012-of-00070.safetensors +3 -0
  15. model-00013-of-00070.safetensors +3 -0
  16. model-00014-of-00070.safetensors +3 -0
  17. model-00015-of-00070.safetensors +3 -0
  18. model-00016-of-00070.safetensors +3 -0
  19. model-00017-of-00070.safetensors +3 -0
  20. model-00018-of-00070.safetensors +3 -0
  21. model-00019-of-00070.safetensors +3 -0
  22. model-00020-of-00070.safetensors +3 -0
  23. model-00021-of-00070.safetensors +3 -0
  24. model-00022-of-00070.safetensors +3 -0
  25. model-00023-of-00070.safetensors +3 -0
  26. model-00024-of-00070.safetensors +3 -0
  27. model-00025-of-00070.safetensors +3 -0
  28. model-00026-of-00070.safetensors +3 -0
  29. model-00027-of-00070.safetensors +3 -0
  30. model-00028-of-00070.safetensors +3 -0
  31. model-00029-of-00070.safetensors +3 -0
  32. model-00030-of-00070.safetensors +3 -0
  33. model-00031-of-00070.safetensors +3 -0
  34. model-00032-of-00070.safetensors +3 -0
  35. model-00033-of-00070.safetensors +3 -0
  36. model-00034-of-00070.safetensors +3 -0
  37. model-00035-of-00070.safetensors +3 -0
  38. model-00036-of-00070.safetensors +3 -0
  39. model-00037-of-00070.safetensors +3 -0
  40. model-00038-of-00070.safetensors +3 -0
  41. model-00039-of-00070.safetensors +3 -0
  42. model-00040-of-00070.safetensors +3 -0
  43. model-00041-of-00070.safetensors +3 -0
  44. model-00042-of-00070.safetensors +3 -0
  45. model-00043-of-00070.safetensors +3 -0
  46. model-00044-of-00070.safetensors +3 -0
  47. model-00045-of-00070.safetensors +3 -0
  48. model-00046-of-00070.safetensors +3 -0
  49. model-00047-of-00070.safetensors +3 -0
  50. model-00048-of-00070.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: deepseek-ai/DeepSeek-V3
3
+ tags:
4
+ - mlx
5
+ ---
6
+
7
+ # mlx-community/DeepSeek-V3-3bit-bf16
8
+
9
+ The model [mlx-community/DeepSeek-V3-3bit-bf16](https://huggingface.co/mlx-community/DeepSeek-V3-3bit-bf16) was
10
+ converted to MLX format from [deepseek-ai/DeepSeek-V3](https://huggingface.co/deepseek-ai/DeepSeek-V3)
11
+ using mlx-lm version **0.20.4**.
12
+
13
+ ## Use with mlx
14
+
15
+ ```bash
16
+ pip install mlx-lm
17
+ ```
18
+
19
+ ```python
20
+ from mlx_lm import load, generate
21
+
22
+ model, tokenizer = load("mlx-community/DeepSeek-V3-3bit-bf16")
23
+
24
+ prompt = "hello"
25
+
26
+ if tokenizer.chat_template is not None:
27
+     messages = [{"role": "user", "content": prompt}]
28
+     prompt = tokenizer.apply_chat_template(
29
+         messages, add_generation_prompt=True
30
+     )
31
+
32
+ response = generate(model, tokenizer, prompt=prompt, verbose=True)
33
+ ```
config.json ADDED
@@ -0,0 +1,69 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "DeepseekV3ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "auto_map": {
8
+ "AutoConfig": "configuration_deepseek.DeepseekV3Config",
9
+ "AutoModel": "modeling_deepseek.DeepseekV3Model",
10
+ "AutoModelForCausalLM": "modeling_deepseek.DeepseekV3ForCausalLM"
11
+ },
12
+ "aux_loss_alpha": 0.001,
13
+ "bos_token_id": 0,
14
+ "eos_token_id": 1,
15
+ "ep_size": 1,
16
+ "first_k_dense_replace": 3,
17
+ "hidden_act": "silu",
18
+ "hidden_size": 7168,
19
+ "initializer_range": 0.02,
20
+ "intermediate_size": 18432,
21
+ "kv_lora_rank": 512,
22
+ "max_position_embeddings": 163840,
23
+ "model_type": "deepseek_v3",
24
+ "moe_intermediate_size": 2048,
25
+ "moe_layer_freq": 1,
26
+ "n_group": 8,
27
+ "n_routed_experts": 256,
28
+ "n_shared_experts": 1,
29
+ "norm_topk_prob": true,
30
+ "num_attention_heads": 128,
31
+ "num_experts_per_tok": 8,
32
+ "num_hidden_layers": 61,
33
+ "num_key_value_heads": 128,
34
+ "num_nextn_predict_layers": 1,
35
+ "pretraining_tp": 1,
36
+ "q_lora_rank": 1536,
37
+ "qk_nope_head_dim": 128,
38
+ "qk_rope_head_dim": 64,
39
+ "quantization": {
40
+ "group_size": 32,
41
+ "bits": 3
42
+ },
43
+ "quantization_config": {
44
+ "group_size": 32,
45
+ "bits": 3
46
+ },
47
+ "rms_norm_eps": 1e-06,
48
+ "rope_scaling": {
49
+ "beta_fast": 32,
50
+ "beta_slow": 1,
51
+ "factor": 40,
52
+ "mscale": 1.0,
53
+ "mscale_all_dim": 1.0,
54
+ "original_max_position_embeddings": 4096,
55
+ "type": "yarn"
56
+ },
57
+ "rope_theta": 10000,
58
+ "routed_scaling_factor": 2.5,
59
+ "scoring_func": "sigmoid",
60
+ "seq_aux": true,
61
+ "tie_word_embeddings": false,
62
+ "topk_group": 4,
63
+ "topk_method": "noaux_tc",
64
+ "torch_dtype": "bfloat16",
65
+ "transformers_version": "4.33.1",
66
+ "use_cache": true,
67
+ "v_head_dim": 128,
68
+ "vocab_size": 129280
69
+ }
model-00001-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec12eb853ea78e85423aa20479bf8a408dd0d5bce8d5da61c92024bd5b5ff476
3
+ size 5190304394
model-00002-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad7d87f5f98469a5b9204fe2c1de2fa2190fbef97e33e78a427159b1c4f4871e
3
+ size 5286663108
model-00003-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34d6107a9d940862650da2c4ce19b44f9a7c3cdd9603ddb414cdb56d55106e82
3
+ size 4347139139
model-00004-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:853dc4907b7f953908dadd687eaf80984ed44c0762e5a5f7b0238fc565724f56
3
+ size 5286663106
model-00005-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47e483fb8585e4554375b3807afa621ad469559f8104c28b2ebc4e31615dfccc
3
+ size 4347139091
model-00006-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1358e4743925162d3466be786e3a15e3e126828393619880038194d7980ee612
3
+ size 5167383445
model-00007-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52c2aff57d51ff9042deea28431c589d8488f7c441da603f925f1fcddf667145
3
+ size 4347139137
model-00008-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c306dc6ef99aac4bea26c1a806a8b00361f83633807764803ac88bddcb5c66d
3
+ size 5286663110
model-00009-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62b375fe5e33eaadd1740699fd3606d52a7efb036b0619cdd6695af46c8cb2e4
3
+ size 4347139159
model-00010-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c563b89a7bfa257421c16d66431c924e655a7851806f50118f83949271ad8fcb
3
+ size 5286663095
model-00011-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:524eaf86260bbab31891717ff0b51d37701ddb7a50d0dc47aaf1a8c68f15edea
3
+ size 4347139087
model-00012-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59cf7d36d25bc361456e019ea5f4b420da180f47bdf6df65ad4292f33fa03152
3
+ size 5167383454
model-00013-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25890a6fcabc63a7de925014fa5780e7199ba561696613c2a08f9e58e609f248
3
+ size 4347139157
model-00014-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f64b15968af0dd5da8fbd496b5a3bcf0820f5b5239eee1e9399d2c33b8cc56cf
3
+ size 5286663109
model-00015-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fc747b202dd0884fbb9bc5a0792888fb5a6e046f675ca0941b741a4e6cad00f
3
+ size 4347139145
model-00016-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42651b179ffd87ac9c0e4d0f179363f37ad9233e57251adcb70867dea28bfa30
3
+ size 5286663143
model-00017-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02ce19658413e02cbfd7a9144f95daaa10c90194120eda4e6752e00011a325bb
3
+ size 4347139101
model-00018-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ec446a846a3d8dd77d53437fc8317e59dad9966c0f89f93ecc3db70c0e33e95
3
+ size 5167383454
model-00019-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b3871185235b38a244787ca141980cff528a9123c01dcc84613d18484c5267b
3
+ size 4347139143
model-00020-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bba65e0f87107b4b4577b0f1bf70044f7d60e01a90fc2f403690fecf7e70a6dd
3
+ size 5286663143
model-00021-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20126dd5b8c0c4a274b8ec510dd6b5844649a5f91283df7a57432c0ebf69a883
3
+ size 4347139175
model-00022-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a124956807e7a79ca1f192273f2db415927d8b0b65c7dbe3f1e2430fa2fc8005
3
+ size 5286663069
model-00023-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77d8d9066d68277ffa003ac877194d5e85f3209ef9df03e0148a45e9fc77602e
3
+ size 4347139067
model-00024-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b704afb0ec2123d374d4bacb02b1d9552a04d0b815115ccce9f05f39e9da489
3
+ size 5167383450
model-00025-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ae06a62cfeac90d803b4de91679cf6dc0cc2277a334d5f389b3014e4b1ae669
3
+ size 4347139175
model-00026-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a83f862940d2b652d72199fe77c77fdfef9d04e1c41b6cb0722e276c1516d850
3
+ size 5286663109
model-00027-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40494c9bf35a6b9bc9e413da64b3ee4a5111621fb1b9c2bb36e44f0681178c52
3
+ size 4347139129
model-00028-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90494c70b544f355b950ebb5b9e64e5e80a1c3cc3a19e36060f6778ea56a9fbe
3
+ size 5286663059
model-00029-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ea7dbfa220f3bfbfb732bdcfa9ad838808cf4054c84902153545e6ec6e7eed0
3
+ size 4347139101
model-00030-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d059ed62d419e872f85e074c00336e71a1b5c2e12c2624fa099a241562e255e
3
+ size 5167383454
model-00031-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ca81c7ad2a543a94d52cd7f7c0f1ee9ac5dc38a34d3c8e0c763ce03530aff90
3
+ size 4347139175
model-00032-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60c447a13bdd6618eb28e2241b815525d92cf83f6ff48334620f451f438d2a51
3
+ size 5286663133
model-00033-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25f074c4da207dd4c52cf3abc881301bfb95534d76b447e4517dfa7c5e195e08
3
+ size 4347139177
model-00034-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbe371abf5a7d4aa9187c4696f5dd28a2ff702e12deff504523ec7eb6294413e
3
+ size 5286663143
model-00035-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8044e76dfdc7723d934febe9d2065d3fb90d92e91ba546d14f0771c4a55e648f
3
+ size 4347139119
model-00036-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df6499f1e97d168e1acd9fc33c8fa3c06b49c6537eab9196732fe6cde9e413a4
3
+ size 5167383452
model-00037-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f3faea2b9514cf1c7e4fb26fef3a63f09d81b250ce0b937f5fabb229c3fc5db
3
+ size 4347139169
model-00038-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a385254825371ee9825e7749538c0be9c88910475fe049a1191cfc286d085423
3
+ size 5286663139
model-00039-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1643472b4cbf7366b73ee5bd099dc5f7d6818fb0813fe8cb4aae909a188fa288
3
+ size 4347139137
model-00040-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a13ff7315056846b82e9ca3fff73de41602a6e978238a13ec8ff14b6b77c4151
3
+ size 5286663143
model-00041-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df6e4d397a03006e73f41a7739616e654e4be359cd616b5caa10841dc2ffef1a
3
+ size 4347139081
model-00042-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:add8ac5d141e3396813004b91ddb7821a0f58ebaf6ee4bdff750953d15b0e8c9
3
+ size 5167383454
model-00043-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdef1e67a40f90804e64bf12f6a0ebc227a4c60beeab0371206fdca3c2ba040d
3
+ size 4347139173
model-00044-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a04a2d7d8354b02e7ec6fc69a1eaf6f32963542b907061144b1836c6e08d3bf8
3
+ size 5286663099
model-00045-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a640daf6c55a62632a9241482032ee171b65ad8bf7d6cca04a430954f732a1b
3
+ size 4347139135
model-00046-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5ee5ccb9dc73fd5bb48bb7762fa0c0ca3330e583bb5bbf0c90e47a84fcee195
3
+ size 5286663143
model-00047-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19e74307f880c4cfabbe19a25abc0657522b6972dac51f4f04778dd341b13e56
3
+ size 4347139109
model-00048-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d9ac35a21fc3eed20497bc34e82317ada1c8890477b92e43ef6d6022017966b
3
+ size 5167383454