# Merge configuration: combines four 70B checkpoints with the `sce` merge
# method, using d-rang-d/ignore_Siyaniye2 as the base model and taking the
# tokenizer from Nohobby/L3.3-Prikol-70B-v0.5.
#
# Each model carries a `select_topk` list. An entry with a `filter` applies
# its `value` to the tensors selected by that filter; the trailing entry
# without a `filter` is the fallback value for everything else.
#
# NOTE(review): mergekit's docs appear to describe `select_topk` as a global
# parameter of `sce` -- confirm that these per-model values are actually
# honored rather than silently ignored.
# NOTE(review): filters containing `|` look like regex alternation -- confirm
# that the filter matcher supports this and is not a plain substring match.
# If `self_attn` already matches the q/k/v projections, the entries after it
# may never be reached; verify evaluation order.
models:
  - model: Nohobby/L3.3-Prikol-70B-v0.5
    parameters:
      select_topk:
        - filter: mlp
          value: 0.2
        - value: 0.14
  - model: NeverSleep/Lumimaid-v0.2-70B
    parameters:
      select_topk:
        - filter: down_proj
          # List value: presumably interpolated across layer depth -- TODO confirm.
          value: [0.08, 0.06, 0.05, 0.05, 0.04]
        - value: 0
  - model: SicariusSicariiStuff/Negative_LLAMA_70B
    parameters:
      select_topk:
        - filter: self_attn
          value: 0.08
        - filter: "q_proj|k_proj|v_proj"
          value: 0.08
        - filter: "up_proj|down_proj"
          value: 0.08
        - value: 0
  # This model is also the base_model below.
  - model: d-rang-d/ignore_Siyaniye2
    parameters:
      select_topk:
        - filter: self_attn
          value: 0.15
        - filter: "q_proj|k_proj|v_proj"
          value: 0.2
        - filter: "up_proj|down_proj"
          value: 0.1
        - filter: mlp
          value: 0.1
        - value: 0.1
merge_method: sce
base_model: d-rang-d/ignore_Siyaniye2
dtype: bfloat16
tokenizer:
  source: Nohobby/L3.3-Prikol-70B-v0.5