absorb perm
Browse files
- config.json +7 -7
- model.safetensors +2 -2
config.json
CHANGED
@@ -42,7 +42,7 @@
|
|
42 |
"down_proj": {
|
43 |
"bias": false,
|
44 |
"enable_norm": true,
|
45 |
-
"enable_perm":
|
46 |
"group_num": 1,
|
47 |
"group_size": 14336,
|
48 |
"in_features": 14336,
|
@@ -66,7 +66,7 @@
|
|
66 |
"gate_proj": {
|
67 |
"bias": false,
|
68 |
"enable_norm": true,
|
69 |
-
"enable_perm":
|
70 |
"group_num": 1,
|
71 |
"group_size": 4096,
|
72 |
"in_features": 4096,
|
@@ -90,7 +90,7 @@
|
|
90 |
"up_proj": {
|
91 |
"bias": false,
|
92 |
"enable_norm": true,
|
93 |
-
"enable_perm":
|
94 |
"group_num": 1,
|
95 |
"group_size": 4096,
|
96 |
"in_features": 4096,
|
@@ -114,7 +114,7 @@
|
|
114 |
"k_proj": {
|
115 |
"bias": false,
|
116 |
"enable_norm": true,
|
117 |
-
"enable_perm":
|
118 |
"group_num": 1,
|
119 |
"group_size": 4096,
|
120 |
"in_features": 4096,
|
@@ -138,7 +138,7 @@
|
|
138 |
"o_proj": {
|
139 |
"bias": false,
|
140 |
"enable_norm": true,
|
141 |
-
"enable_perm":
|
142 |
"group_num": 1,
|
143 |
"group_size": 4096,
|
144 |
"in_features": 4096,
|
@@ -162,7 +162,7 @@
|
|
162 |
"q_proj": {
|
163 |
"bias": false,
|
164 |
"enable_norm": true,
|
165 |
-
"enable_perm":
|
166 |
"group_num": 1,
|
167 |
"group_size": 4096,
|
168 |
"in_features": 4096,
|
@@ -186,7 +186,7 @@
|
|
186 |
"v_proj": {
|
187 |
"bias": false,
|
188 |
"enable_norm": true,
|
189 |
-
"enable_perm":
|
190 |
"group_num": 1,
|
191 |
"group_size": 4096,
|
192 |
"in_features": 4096,
|
|
|
42 |
"down_proj": {
|
43 |
"bias": false,
|
44 |
"enable_norm": true,
|
45 |
+
"enable_perm": false,
|
46 |
"group_num": 1,
|
47 |
"group_size": 14336,
|
48 |
"in_features": 14336,
|
|
|
66 |
"gate_proj": {
|
67 |
"bias": false,
|
68 |
"enable_norm": true,
|
69 |
+
"enable_perm": false,
|
70 |
"group_num": 1,
|
71 |
"group_size": 4096,
|
72 |
"in_features": 4096,
|
|
|
90 |
"up_proj": {
|
91 |
"bias": false,
|
92 |
"enable_norm": true,
|
93 |
+
"enable_perm": false,
|
94 |
"group_num": 1,
|
95 |
"group_size": 4096,
|
96 |
"in_features": 4096,
|
|
|
114 |
"k_proj": {
|
115 |
"bias": false,
|
116 |
"enable_norm": true,
|
117 |
+
"enable_perm": false,
|
118 |
"group_num": 1,
|
119 |
"group_size": 4096,
|
120 |
"in_features": 4096,
|
|
|
138 |
"o_proj": {
|
139 |
"bias": false,
|
140 |
"enable_norm": true,
|
141 |
+
"enable_perm": false,
|
142 |
"group_num": 1,
|
143 |
"group_size": 4096,
|
144 |
"in_features": 4096,
|
|
|
162 |
"q_proj": {
|
163 |
"bias": false,
|
164 |
"enable_norm": true,
|
165 |
+
"enable_perm": false,
|
166 |
"group_num": 1,
|
167 |
"group_size": 4096,
|
168 |
"in_features": 4096,
|
|
|
186 |
"v_proj": {
|
187 |
"bias": false,
|
188 |
"enable_norm": true,
|
189 |
+
"enable_perm": false,
|
190 |
"group_num": 1,
|
191 |
"group_size": 4096,
|
192 |
"in_features": 4096,
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8cc99bc5d06585dd3201a7536d96140446fbdcc6b4d075b5854428f943d8b1e
|
3 |
+
size 4519579120
|