Upload 2 files
Browse files
Very early layerskip-aware weights
.gitattributes
CHANGED
@@ -17,3 +17,4 @@ loras/ckpt/lora-cyberpunk-silverhand-r128-a128/lora.sft filter=lfs diff=lfs merg
|
|
17 |
loras/ckpt/lora-cyberpunk-takemura-r128-a128/lora.sft filter=lfs diff=lfs merge=lfs -text
|
18 |
loras/ckpt/lora-portal-glados-r128-a128/lora.sft filter=lfs diff=lfs merge=lfs -text
|
19 |
loras/ckpt/lora-samandmax-sam-r128-a128/lora.sft filter=lfs diff=lfs merge=lfs -text
|
|
|
|
17 |
loras/ckpt/lora-cyberpunk-takemura-r128-a128/lora.sft filter=lfs diff=lfs merge=lfs -text
|
18 |
loras/ckpt/lora-portal-glados-r128-a128/lora.sft filter=lfs diff=lfs merge=lfs -text
|
19 |
loras/ckpt/lora-samandmax-sam-r128-a128/lora.sft filter=lfs diff=lfs merge=lfs -text
|
20 |
+
models/ckpt/ar+nar-layerskip-llama-8/fp32.sft filter=lfs diff=lfs merge=lfs -text
|
models/ckpt/ar+nar-layerskip-llama-8/fp32.sft
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:232e0cec837102824e5d8b19cd4d3a138566aa7b9f048fa7c48049c5398e0677
|
3 |
+
size 456274634
|
models/config.llama[layerskip].yaml
ADDED
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
models:
|
2 |
+
- name: "ar+nar-layerskip"
|
3 |
+
size: "full"
|
4 |
+
resp_levels: 8
|
5 |
+
tasks: 9
|
6 |
+
langs: 4
|
7 |
+
tones: 1
|
8 |
+
arch_type: llama
|
9 |
+
attention: auto
|
10 |
+
version: 5
|
11 |
+
|
12 |
+
capabilities: ["ar", "nar"]
|
13 |
+
experimental:
|
14 |
+
split_classifiers: True
|
15 |
+
audio_embedding_sums: True
|
16 |
+
unified_position_ids: False
|
17 |
+
layerskip: True
|