Citaman committed (verified)
Commit 0a19d37
Parent(s): b72732b

Upload folder using huggingface_hub
README.md CHANGED
@@ -29,9 +29,9 @@ The following YAML configuration was used to produce this model:
 slices:
 - sources:
   - model: Citaman/command-r-36-layer
-    layer_range: [0, 34]
+    layer_range: [0, 35]
   - model: Citaman/command-r-36-layer
-    layer_range: [1, 35]
+    layer_range: [1, 36]
 merge_method: slerp
 base_model: Citaman/command-r-36-layer
 parameters:
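mergekit treats layer_range as end-exclusive, so the corrected slices [0, 35] and [1, 36] each cover 35 layers of the 36-layer source model, offset by one; under SLERP, output layer i is interpolated between source layers i and i+1, which matches the num_hidden_layers bump in config.json below. A minimal sketch of the pairing this implies (illustration only, not part of the commit):

```python
# Illustration only: how the two offset, end-exclusive layer_range slices pair up.
range_a = (0, 35)  # layers 0..34 of Citaman/command-r-36-layer
range_b = (1, 36)  # layers 1..35 of the same model

pairs = list(zip(range(*range_a), range(*range_b)))
print(len(pairs))            # 35 -> matches num_hidden_layers after this commit
print(pairs[0], pairs[-1])   # (0, 1) ... (34, 35): each output layer blends layer i with layer i+1
```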
config.json CHANGED
@@ -17,7 +17,7 @@
   "model_max_length": 131072,
   "model_type": "cohere",
   "num_attention_heads": 64,
-  "num_hidden_layers": 34,
+  "num_hidden_layers": 35,
   "num_key_value_heads": 64,
   "pad_token_id": 0,
   "pretraining_tp": 1,
mergekit_config.yml CHANGED
@@ -1,9 +1,9 @@
 slices:
 - sources:
   - model: Citaman/command-r-36-layer
-    layer_range: [0, 34]
+    layer_range: [0, 35]
   - model: Citaman/command-r-36-layer
-    layer_range: [1, 35]
+    layer_range: [1, 36]
 merge_method: slerp
 base_model: Citaman/command-r-36-layer
 parameters:
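The same correction lands in mergekit_config.yml, the file mergekit actually consumes. A small sanity check one could run before re-merging (a sketch assuming PyYAML and the structure shown above):

```python
# Hypothetical sanity check: both slices should now span 35 layers, offset by one.
import yaml

with open("mergekit_config.yml") as f:
    cfg = yaml.safe_load(f)

ranges = [src["layer_range"] for src in cfg["slices"][0]["sources"]]
assert [end - start for start, end in ranges] == [35, 35], ranges
assert ranges[1][0] - ranges[0][0] == 1  # second slice shifted down by one layer
assert cfg["merge_method"] == "slerp"
```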
model-00003-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:de180ac1cbbc2df1dc17e2b0c53eddd324da58172746ec8a7b72f857d37e9074
-size 9831552200
+oid sha256:1a0c3e6049986a34ac86227129e19ac2e6495b604cacc3f12f405b1de64ca916
+size 9999324720
model-00004-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7f8ca0453495ab9c4af6d31e741d8f0abaa7e848443d558fa821a2de44710ca1
-size 9932281376
+oid sha256:3966bfc65ef526f80cc7f59c094b88cd10eb41c1e56e793b9d69fde8b5c637f9
+size 9898693712
model-00005-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:af4f861475b120711951c054d72c6d4eba53e0b345cac4e766cd74f6628e5714
-size 9663764064
+oid sha256:8ce8f59130108f22d447d94997782c1519ac922460f576b3d993f6629a1f0d3e
+size 9697350896
model-00006-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7cb1a16ddba0c919fe65529338669613fa93550d0a275c4fdc2442b639556fe6
-size 9865122576
+oid sha256:9a661889aa282f0305160b2991e914da4c4c8bc02cc8c8a399a751ce8798d0a0
+size 9697350896
model-00007-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ae3ae1e1c98175d9d3c140b3785c58bc77ad395f5f80ead3a944ae21373d10e5
-size 5335239160
+oid sha256:ecf8940729c73d20f49da96a23f4b7bb43ca1c031c45671bc2a27e09e0b05175
+size 6979423640
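The shard files themselves live in Git LFS, so the repository only tracks pointer files recording each blob's sha256 and byte size; both change here because the extra layer redistributes tensors across the shards shown above (3 through 7). A hedged sketch of verifying a downloaded shard against its pointer (helper names are illustrative):

```python
# Hypothetical verification of a downloaded shard against its Git LFS pointer.
import hashlib
from pathlib import Path

def lfs_pointer_fields(pointer_path):
    """Parse 'oid sha256:<hex>' and 'size <bytes>' from a Git LFS pointer file."""
    fields = dict(line.split(" ", 1) for line in Path(pointer_path).read_text().splitlines())
    return fields["oid"].removeprefix("sha256:"), int(fields["size"])

def verify_shard(shard_path, pointer_path):
    expected_oid, expected_size = lfs_pointer_fields(pointer_path)
    digest, size = hashlib.sha256(), 0
    with open(shard_path, "rb") as f:
        for chunk in iter(lambda: f.read(1 << 20), b""):  # stream; shards are ~10 GB
            digest.update(chunk)
            size += len(chunk)
    return size == expected_size and digest.hexdigest() == expected_oid
```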
model.safetensors.index.json CHANGED
@@ -1 +1 @@
- {"metadata": {"mergekit_version": "0.0.4.2", "total_size": 64290865152}, "weight_map": {"lm_head.weight": "model-00001-of-00007.safetensors", "model.layers.16.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", "model.layers.16.self_attn.v_proj.weight": "model-00001-of-00007.safetensors", "model.layers.16.self_attn.k_proj.weight": "model-00001-of-00007.safetensors", "model.layers.16.self_attn.q_proj.weight": "model-00001-of-00007.safetensors", "model.layers.10.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", "model.layers.10.self_attn.v_proj.weight": "model-00001-of-00007.safetensors", "model.layers.10.self_attn.k_proj.weight": "model-00001-of-00007.safetensors", "model.layers.10.self_attn.q_proj.weight": "model-00001-of-00007.safetensors", "model.layers.9.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", "model.layers.9.self_attn.v_proj.weight": "model-00001-of-00007.safetensors", "model.layers.9.self_attn.k_proj.weight": "model-00001-of-00007.safetensors", "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", "model.embed_tokens.weight": "model-00001-of-00007.safetensors", "model.layers.22.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.22.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.22.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.22.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.21.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.21.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.21.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.21.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.21.mlp.up_proj.weight": "model-00002-of-00007.safetensors", "model.layers.15.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.15.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.15.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.15.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.15.mlp.up_proj.weight": "model-00002-of-00007.safetensors", "model.layers.15.mlp.gate_proj.weight": "model-00002-of-00007.safetensors", "model.layers.9.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.9.mlp.up_proj.weight": "model-00002-of-00007.safetensors", "model.layers.9.mlp.gate_proj.weight": "model-00002-of-00007.safetensors", "model.layers.4.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.4.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.4.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.mlp.up_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.mlp.gate_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.mlp.down_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.input_layernorm.weight": "model-00002-of-00007.safetensors", "model.layers.2.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.2.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", 
"model.layers.2.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.1.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.1.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.1.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.1.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.mlp.up_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.mlp.gate_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.mlp.down_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.input_layernorm.weight": "model-00002-of-00007.safetensors", "model.layers.28.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.28.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.28.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.28.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.27.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.27.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.27.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.27.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.27.mlp.up_proj.weight": "model-00002-of-00007.safetensors", "model.layers.21.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", "model.layers.9.mlp.down_proj.weight": "model-00003-of-00007.safetensors", "model.layers.9.input_layernorm.weight": "model-00003-of-00007.safetensors", "model.layers.8.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", "model.layers.8.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", "model.layers.8.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", "model.layers.8.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", "model.layers.7.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", "model.layers.7.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", "model.layers.7.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", "model.layers.7.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.mlp.up_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.mlp.down_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.input_layernorm.weight": "model-00003-of-00007.safetensors", "model.layers.5.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", "model.layers.5.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", "model.layers.5.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", "model.layers.5.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", "model.layers.5.mlp.up_proj.weight": 
"model-00003-of-00007.safetensors", "model.layers.5.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", "model.layers.5.mlp.down_proj.weight": "model-00003-of-00007.safetensors", "model.layers.5.input_layernorm.weight": "model-00003-of-00007.safetensors", "model.layers.4.mlp.up_proj.weight": "model-00003-of-00007.safetensors", "model.layers.4.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", "model.layers.4.mlp.down_proj.weight": "model-00003-of-00007.safetensors", "model.layers.4.input_layernorm.weight": "model-00003-of-00007.safetensors", "model.layers.2.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", "model.layers.2.mlp.up_proj.weight": "model-00003-of-00007.safetensors", "model.layers.2.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", "model.layers.2.mlp.down_proj.weight": "model-00003-of-00007.safetensors", "model.layers.2.input_layernorm.weight": "model-00003-of-00007.safetensors", "model.layers.1.mlp.up_proj.weight": "model-00003-of-00007.safetensors", "model.layers.1.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", "model.layers.1.mlp.down_proj.weight": "model-00003-of-00007.safetensors", "model.layers.1.input_layernorm.weight": "model-00003-of-00007.safetensors", "model.layers.33.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", "model.layers.33.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", "model.layers.33.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", "model.layers.33.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", "model.layers.33.mlp.up_proj.weight": "model-00003-of-00007.safetensors", "model.layers.27.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", "model.layers.21.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.21.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.layers.20.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", "model.layers.20.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", "model.layers.15.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.15.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.layers.14.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", "model.layers.14.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", "model.layers.14.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", "model.layers.14.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", "model.layers.13.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", "model.layers.13.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", "model.layers.13.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", "model.layers.13.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.mlp.up_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.layers.11.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", "model.layers.11.self_attn.v_proj.weight": 
"model-00004-of-00007.safetensors", "model.layers.11.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", "model.layers.11.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", "model.layers.11.mlp.up_proj.weight": "model-00004-of-00007.safetensors", "model.layers.11.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", "model.layers.11.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.11.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.layers.10.mlp.up_proj.weight": "model-00004-of-00007.safetensors", "model.layers.10.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", "model.layers.10.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.10.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.layers.8.mlp.up_proj.weight": "model-00004-of-00007.safetensors", "model.layers.8.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", "model.layers.8.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.8.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.layers.7.mlp.up_proj.weight": "model-00004-of-00007.safetensors", "model.layers.7.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", "model.layers.7.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.7.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.norm.weight": "model-00004-of-00007.safetensors", "model.layers.33.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", "model.layers.33.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.33.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.layers.27.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.27.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.layers.26.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", "model.layers.26.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", "model.layers.26.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", "model.layers.26.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", "model.layers.25.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", "model.layers.25.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", "model.layers.25.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", "model.layers.25.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", "model.layers.24.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", "model.layers.24.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", "model.layers.24.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", "model.layers.20.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", "model.layers.20.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", "model.layers.19.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", "model.layers.19.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", "model.layers.19.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", "model.layers.19.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.mlp.up_proj.weight": 
"model-00005-of-00007.safetensors", "model.layers.18.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.mlp.down_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.input_layernorm.weight": "model-00005-of-00007.safetensors", "model.layers.17.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", "model.layers.17.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", "model.layers.17.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", "model.layers.17.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", "model.layers.17.mlp.up_proj.weight": "model-00005-of-00007.safetensors", "model.layers.17.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", "model.layers.17.mlp.down_proj.weight": "model-00005-of-00007.safetensors", "model.layers.17.input_layernorm.weight": "model-00005-of-00007.safetensors", "model.layers.16.mlp.up_proj.weight": "model-00005-of-00007.safetensors", "model.layers.16.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", "model.layers.16.mlp.down_proj.weight": "model-00005-of-00007.safetensors", "model.layers.16.input_layernorm.weight": "model-00005-of-00007.safetensors", "model.layers.14.mlp.up_proj.weight": "model-00005-of-00007.safetensors", "model.layers.14.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", "model.layers.14.mlp.down_proj.weight": "model-00005-of-00007.safetensors", "model.layers.14.input_layernorm.weight": "model-00005-of-00007.safetensors", "model.layers.13.mlp.up_proj.weight": "model-00005-of-00007.safetensors", "model.layers.13.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", "model.layers.13.mlp.down_proj.weight": "model-00005-of-00007.safetensors", "model.layers.13.input_layernorm.weight": "model-00005-of-00007.safetensors", "model.layers.32.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", "model.layers.32.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", "model.layers.32.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", "model.layers.32.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", "model.layers.32.mlp.up_proj.weight": "model-00005-of-00007.safetensors", "model.layers.32.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", "model.layers.32.mlp.down_proj.weight": "model-00006-of-00007.safetensors", "model.layers.32.input_layernorm.weight": "model-00006-of-00007.safetensors", "model.layers.31.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", "model.layers.31.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", "model.layers.31.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", "model.layers.31.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", "model.layers.31.mlp.up_proj.weight": "model-00006-of-00007.safetensors", "model.layers.31.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", "model.layers.31.mlp.down_proj.weight": "model-00006-of-00007.safetensors", "model.layers.31.input_layernorm.weight": "model-00006-of-00007.safetensors", "model.layers.30.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", "model.layers.30.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", "model.layers.30.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", "model.layers.24.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", "model.layers.24.mlp.up_proj.weight": "model-00006-of-00007.safetensors", "model.layers.24.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", "model.layers.24.mlp.down_proj.weight": 
"model-00006-of-00007.safetensors", "model.layers.24.input_layernorm.weight": "model-00006-of-00007.safetensors", "model.layers.23.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", "model.layers.23.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", "model.layers.23.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", "model.layers.23.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", "model.layers.23.mlp.up_proj.weight": "model-00006-of-00007.safetensors", "model.layers.23.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", "model.layers.23.mlp.down_proj.weight": "model-00006-of-00007.safetensors", "model.layers.23.input_layernorm.weight": "model-00006-of-00007.safetensors", "model.layers.22.mlp.up_proj.weight": "model-00006-of-00007.safetensors", "model.layers.22.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", "model.layers.22.mlp.down_proj.weight": "model-00006-of-00007.safetensors", "model.layers.22.input_layernorm.weight": "model-00006-of-00007.safetensors", "model.layers.20.mlp.up_proj.weight": "model-00006-of-00007.safetensors", "model.layers.20.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", "model.layers.20.mlp.down_proj.weight": "model-00006-of-00007.safetensors", "model.layers.20.input_layernorm.weight": "model-00006-of-00007.safetensors", "model.layers.19.mlp.up_proj.weight": "model-00006-of-00007.safetensors", "model.layers.19.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", "model.layers.19.mlp.down_proj.weight": "model-00006-of-00007.safetensors", "model.layers.19.input_layernorm.weight": "model-00006-of-00007.safetensors", "model.layers.30.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", "model.layers.30.mlp.up_proj.weight": "model-00006-of-00007.safetensors", "model.layers.30.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", "model.layers.30.mlp.down_proj.weight": "model-00007-of-00007.safetensors", "model.layers.30.input_layernorm.weight": "model-00007-of-00007.safetensors", "model.layers.29.self_attn.o_proj.weight": "model-00007-of-00007.safetensors", "model.layers.29.self_attn.v_proj.weight": "model-00007-of-00007.safetensors", "model.layers.29.self_attn.k_proj.weight": "model-00007-of-00007.safetensors", "model.layers.29.self_attn.q_proj.weight": "model-00007-of-00007.safetensors", "model.layers.29.mlp.up_proj.weight": "model-00007-of-00007.safetensors", "model.layers.29.mlp.gate_proj.weight": "model-00007-of-00007.safetensors", "model.layers.29.mlp.down_proj.weight": "model-00007-of-00007.safetensors", "model.layers.29.input_layernorm.weight": "model-00007-of-00007.safetensors", "model.layers.28.mlp.up_proj.weight": "model-00007-of-00007.safetensors", "model.layers.28.mlp.gate_proj.weight": "model-00007-of-00007.safetensors", "model.layers.28.mlp.down_proj.weight": "model-00007-of-00007.safetensors", "model.layers.28.input_layernorm.weight": "model-00007-of-00007.safetensors", "model.layers.26.mlp.up_proj.weight": "model-00007-of-00007.safetensors", "model.layers.26.mlp.gate_proj.weight": "model-00007-of-00007.safetensors", "model.layers.26.mlp.down_proj.weight": "model-00007-of-00007.safetensors", "model.layers.26.input_layernorm.weight": "model-00007-of-00007.safetensors", "model.layers.25.mlp.up_proj.weight": "model-00007-of-00007.safetensors", "model.layers.25.mlp.gate_proj.weight": "model-00007-of-00007.safetensors", "model.layers.25.mlp.down_proj.weight": "model-00007-of-00007.safetensors", "model.layers.25.input_layernorm.weight": 
"model-00007-of-00007.safetensors"}}
 
1
+ {"metadata": {"mergekit_version": "0.0.4.2", "total_size": 65935048704}, "weight_map": {"lm_head.weight": "model-00001-of-00007.safetensors", "model.layers.16.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", "model.layers.16.self_attn.v_proj.weight": "model-00001-of-00007.safetensors", "model.layers.16.self_attn.k_proj.weight": "model-00001-of-00007.safetensors", "model.layers.16.self_attn.q_proj.weight": "model-00001-of-00007.safetensors", "model.layers.10.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", "model.layers.10.self_attn.v_proj.weight": "model-00001-of-00007.safetensors", "model.layers.10.self_attn.k_proj.weight": "model-00001-of-00007.safetensors", "model.layers.10.self_attn.q_proj.weight": "model-00001-of-00007.safetensors", "model.layers.9.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", "model.layers.9.self_attn.v_proj.weight": "model-00001-of-00007.safetensors", "model.layers.9.self_attn.k_proj.weight": "model-00001-of-00007.safetensors", "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", "model.embed_tokens.weight": "model-00001-of-00007.safetensors", "model.layers.22.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.22.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.22.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.22.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.21.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.21.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.21.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.21.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.21.mlp.up_proj.weight": "model-00002-of-00007.safetensors", "model.layers.15.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.15.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.15.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.15.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.15.mlp.up_proj.weight": "model-00002-of-00007.safetensors", "model.layers.15.mlp.gate_proj.weight": "model-00002-of-00007.safetensors", "model.layers.9.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.9.mlp.up_proj.weight": "model-00002-of-00007.safetensors", "model.layers.9.mlp.gate_proj.weight": "model-00002-of-00007.safetensors", "model.layers.4.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.4.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.4.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.mlp.up_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.mlp.gate_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.mlp.down_proj.weight": "model-00002-of-00007.safetensors", "model.layers.3.input_layernorm.weight": "model-00002-of-00007.safetensors", "model.layers.2.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.2.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", 
"model.layers.2.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.1.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.1.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.1.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.1.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.mlp.up_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.mlp.gate_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.mlp.down_proj.weight": "model-00002-of-00007.safetensors", "model.layers.0.input_layernorm.weight": "model-00002-of-00007.safetensors", "model.layers.28.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.28.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.28.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.28.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.27.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", "model.layers.27.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", "model.layers.27.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", "model.layers.27.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", "model.layers.27.mlp.up_proj.weight": "model-00002-of-00007.safetensors", "model.layers.21.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", "model.layers.9.mlp.down_proj.weight": "model-00003-of-00007.safetensors", "model.layers.9.input_layernorm.weight": "model-00003-of-00007.safetensors", "model.layers.8.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", "model.layers.8.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", "model.layers.8.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", "model.layers.8.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", "model.layers.7.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", "model.layers.7.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", "model.layers.7.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", "model.layers.7.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.mlp.up_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.mlp.down_proj.weight": "model-00003-of-00007.safetensors", "model.layers.6.input_layernorm.weight": "model-00003-of-00007.safetensors", "model.layers.5.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", "model.layers.5.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", "model.layers.5.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", "model.layers.5.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", "model.layers.5.mlp.up_proj.weight": 
"model-00003-of-00007.safetensors", "model.layers.5.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", "model.layers.5.mlp.down_proj.weight": "model-00003-of-00007.safetensors", "model.layers.5.input_layernorm.weight": "model-00003-of-00007.safetensors", "model.layers.4.mlp.up_proj.weight": "model-00003-of-00007.safetensors", "model.layers.4.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", "model.layers.4.mlp.down_proj.weight": "model-00003-of-00007.safetensors", "model.layers.4.input_layernorm.weight": "model-00003-of-00007.safetensors", "model.layers.2.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", "model.layers.2.mlp.up_proj.weight": "model-00003-of-00007.safetensors", "model.layers.2.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", "model.layers.2.mlp.down_proj.weight": "model-00003-of-00007.safetensors", "model.layers.2.input_layernorm.weight": "model-00003-of-00007.safetensors", "model.layers.1.mlp.up_proj.weight": "model-00003-of-00007.safetensors", "model.layers.1.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", "model.layers.1.mlp.down_proj.weight": "model-00003-of-00007.safetensors", "model.layers.1.input_layernorm.weight": "model-00003-of-00007.safetensors", "model.layers.34.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", "model.layers.34.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", "model.layers.34.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", "model.layers.34.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", "model.layers.33.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", "model.layers.33.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", "model.layers.33.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", "model.layers.33.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", "model.layers.33.mlp.up_proj.weight": "model-00003-of-00007.safetensors", "model.layers.27.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", "model.layers.15.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.15.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.layers.14.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", "model.layers.14.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", "model.layers.14.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", "model.layers.14.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", "model.layers.13.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", "model.layers.13.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", "model.layers.13.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", "model.layers.13.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.mlp.up_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.12.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.layers.11.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", "model.layers.11.self_attn.v_proj.weight": 
"model-00004-of-00007.safetensors", "model.layers.11.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", "model.layers.11.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", "model.layers.11.mlp.up_proj.weight": "model-00004-of-00007.safetensors", "model.layers.11.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", "model.layers.11.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.11.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.layers.10.mlp.up_proj.weight": "model-00004-of-00007.safetensors", "model.layers.10.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", "model.layers.10.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.10.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.layers.8.mlp.up_proj.weight": "model-00004-of-00007.safetensors", "model.layers.8.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", "model.layers.8.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.8.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.layers.7.mlp.up_proj.weight": "model-00004-of-00007.safetensors", "model.layers.7.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", "model.layers.7.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.7.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.norm.weight": "model-00004-of-00007.safetensors", "model.layers.34.mlp.up_proj.weight": "model-00004-of-00007.safetensors", "model.layers.34.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", "model.layers.34.mlp.down_proj.weight": "model-00004-of-00007.safetensors", "model.layers.34.input_layernorm.weight": "model-00004-of-00007.safetensors", "model.layers.33.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", "model.layers.33.mlp.down_proj.weight": "model-00005-of-00007.safetensors", "model.layers.33.input_layernorm.weight": "model-00005-of-00007.safetensors", "model.layers.21.mlp.down_proj.weight": "model-00005-of-00007.safetensors", "model.layers.21.input_layernorm.weight": "model-00005-of-00007.safetensors", "model.layers.20.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", "model.layers.20.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", "model.layers.20.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", "model.layers.20.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", "model.layers.19.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", "model.layers.19.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", "model.layers.19.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", "model.layers.19.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.mlp.up_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.mlp.down_proj.weight": "model-00005-of-00007.safetensors", "model.layers.18.input_layernorm.weight": "model-00005-of-00007.safetensors", "model.layers.17.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", "model.layers.17.self_attn.v_proj.weight": 
"model-00005-of-00007.safetensors", "model.layers.17.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", "model.layers.17.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", "model.layers.17.mlp.up_proj.weight": "model-00005-of-00007.safetensors", "model.layers.17.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", "model.layers.17.mlp.down_proj.weight": "model-00005-of-00007.safetensors", "model.layers.17.input_layernorm.weight": "model-00005-of-00007.safetensors", "model.layers.16.mlp.up_proj.weight": "model-00005-of-00007.safetensors", "model.layers.16.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", "model.layers.16.mlp.down_proj.weight": "model-00005-of-00007.safetensors", "model.layers.16.input_layernorm.weight": "model-00005-of-00007.safetensors", "model.layers.14.mlp.up_proj.weight": "model-00005-of-00007.safetensors", "model.layers.14.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", "model.layers.14.mlp.down_proj.weight": "model-00005-of-00007.safetensors", "model.layers.14.input_layernorm.weight": "model-00005-of-00007.safetensors", "model.layers.13.mlp.up_proj.weight": "model-00005-of-00007.safetensors", "model.layers.13.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", "model.layers.13.mlp.down_proj.weight": "model-00005-of-00007.safetensors", "model.layers.13.input_layernorm.weight": "model-00005-of-00007.safetensors", "model.layers.32.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", "model.layers.32.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", "model.layers.32.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", "model.layers.32.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", "model.layers.32.mlp.up_proj.weight": "model-00005-of-00007.safetensors", "model.layers.32.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", "model.layers.32.mlp.down_proj.weight": "model-00006-of-00007.safetensors", "model.layers.32.input_layernorm.weight": "model-00006-of-00007.safetensors", "model.layers.31.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", "model.layers.31.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", "model.layers.27.mlp.down_proj.weight": "model-00006-of-00007.safetensors", "model.layers.27.input_layernorm.weight": "model-00006-of-00007.safetensors", "model.layers.26.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", "model.layers.26.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", "model.layers.26.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", "model.layers.26.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", "model.layers.25.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", "model.layers.25.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", "model.layers.25.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", "model.layers.25.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", "model.layers.24.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", "model.layers.24.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", "model.layers.24.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", "model.layers.24.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", "model.layers.24.mlp.up_proj.weight": "model-00006-of-00007.safetensors", "model.layers.24.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", "model.layers.24.mlp.down_proj.weight": "model-00006-of-00007.safetensors", 
"model.layers.24.input_layernorm.weight": "model-00006-of-00007.safetensors", "model.layers.23.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", "model.layers.23.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", "model.layers.23.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", "model.layers.23.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", "model.layers.23.mlp.up_proj.weight": "model-00006-of-00007.safetensors", "model.layers.23.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", "model.layers.23.mlp.down_proj.weight": "model-00006-of-00007.safetensors", "model.layers.23.input_layernorm.weight": "model-00006-of-00007.safetensors", "model.layers.22.mlp.up_proj.weight": "model-00006-of-00007.safetensors", "model.layers.22.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", "model.layers.22.mlp.down_proj.weight": "model-00006-of-00007.safetensors", "model.layers.22.input_layernorm.weight": "model-00006-of-00007.safetensors", "model.layers.20.mlp.up_proj.weight": "model-00006-of-00007.safetensors", "model.layers.20.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", "model.layers.20.mlp.down_proj.weight": "model-00006-of-00007.safetensors", "model.layers.20.input_layernorm.weight": "model-00006-of-00007.safetensors", "model.layers.19.mlp.up_proj.weight": "model-00006-of-00007.safetensors", "model.layers.19.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", "model.layers.19.mlp.down_proj.weight": "model-00006-of-00007.safetensors", "model.layers.19.input_layernorm.weight": "model-00006-of-00007.safetensors", "model.layers.31.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", "model.layers.31.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", "model.layers.31.mlp.up_proj.weight": "model-00006-of-00007.safetensors", "model.layers.31.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", "model.layers.31.mlp.down_proj.weight": "model-00007-of-00007.safetensors", "model.layers.31.input_layernorm.weight": "model-00007-of-00007.safetensors", "model.layers.30.self_attn.o_proj.weight": "model-00007-of-00007.safetensors", "model.layers.30.self_attn.v_proj.weight": "model-00007-of-00007.safetensors", "model.layers.30.self_attn.k_proj.weight": "model-00007-of-00007.safetensors", "model.layers.30.self_attn.q_proj.weight": "model-00007-of-00007.safetensors", "model.layers.30.mlp.up_proj.weight": "model-00007-of-00007.safetensors", "model.layers.30.mlp.gate_proj.weight": "model-00007-of-00007.safetensors", "model.layers.30.mlp.down_proj.weight": "model-00007-of-00007.safetensors", "model.layers.30.input_layernorm.weight": "model-00007-of-00007.safetensors", "model.layers.29.self_attn.o_proj.weight": "model-00007-of-00007.safetensors", "model.layers.29.self_attn.v_proj.weight": "model-00007-of-00007.safetensors", "model.layers.29.self_attn.k_proj.weight": "model-00007-of-00007.safetensors", "model.layers.29.self_attn.q_proj.weight": "model-00007-of-00007.safetensors", "model.layers.29.mlp.up_proj.weight": "model-00007-of-00007.safetensors", "model.layers.29.mlp.gate_proj.weight": "model-00007-of-00007.safetensors", "model.layers.29.mlp.down_proj.weight": "model-00007-of-00007.safetensors", "model.layers.29.input_layernorm.weight": "model-00007-of-00007.safetensors", "model.layers.28.mlp.up_proj.weight": "model-00007-of-00007.safetensors", "model.layers.28.mlp.gate_proj.weight": "model-00007-of-00007.safetensors", "model.layers.28.mlp.down_proj.weight": "model-00007-of-00007.safetensors", 
"model.layers.28.input_layernorm.weight": "model-00007-of-00007.safetensors", "model.layers.26.mlp.up_proj.weight": "model-00007-of-00007.safetensors", "model.layers.26.mlp.gate_proj.weight": "model-00007-of-00007.safetensors", "model.layers.26.mlp.down_proj.weight": "model-00007-of-00007.safetensors", "model.layers.26.input_layernorm.weight": "model-00007-of-00007.safetensors", "model.layers.25.mlp.up_proj.weight": "model-00007-of-00007.safetensors", "model.layers.25.mlp.gate_proj.weight": "model-00007-of-00007.safetensors", "model.layers.25.mlp.down_proj.weight": "model-00007-of-00007.safetensors", "model.layers.25.input_layernorm.weight": "model-00007-of-00007.safetensors"}}