Llama-3.1-8B-Squareroot-v0 / mergekit_config.yml
models:
  - model: NousResearch/Meta-Llama-3.1-8B-Instruct # instruct model
    parameters:
      density: [1, 0.8, 0.5] # list values form a gradient interpolated across layers
      weight: 1.0
  - model: EpistemeAI/Fireball-Alpaca-Llama3.1.07-8B-Philos-Math-KTO-beta # Reasoning/Logic model
    parameters:
      density: [0.9, 0.6, 0.4]
      weight: [0.3, 0.6, 0.9]
  - model: nvidia/OpenMath2-Llama3.1-8B # Math model
    parameters:
      density: 0.7
      weight:
        - filter: mlp # weight 0.7 for MLP tensors...
          value: 0.7
        - value: 0.3 # ...and 0.3 for all other tensors
merge_method: ties
base_model: vicgalle/Configurable-Llama-3.1-8B-Instruct # General base model
parameters:
  normalize: true # rescale merge weights so they sum to 1
dtype: float16
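
A minimal sketch of how a config like this is typically applied with the mergekit CLI, assuming mergekit is installed; the output directory name is illustrative and --cuda is optional:

    pip install mergekit
    mergekit-yaml mergekit_config.yml ./Llama-3.1-8B-Squareroot-v0 --cuda

mergekit reads the recipe above, applies the TIES merge of the three listed models on top of the base model, and writes the merged weights to the output directory.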