---
# Model-merge configuration: SLERP interpolation between two Qwen2.5 0.5B
# checkpoints. The key layout looks like a mergekit config -- TODO confirm
# against the tool that actually consumes this file.

# Base model for the merge.
base_model: Qwen/Qwen2.5-Coder-0.5B-Instruct

slices:
  - sources:
      # NOTE(review): if the consumer treats layer_range as a half-open
      # [start, end) interval and these models have 24 transformer layers,
      # [0, 23] leaves the last layer out of the merge -- confirm whether
      # [0, 24] was intended.
      - model: Qwen/Qwen2.5-Coder-0.5B-Instruct
        layer_range: [0, 23]
      - model: Hachipo/qwen2.5-0.5B_ichikara_4802
        layer_range: [0, 23]
        # NOTE(review): the original indentation was lost, so nesting this
        # key under the second source is an assumption. It is also not a key
        # the reviewer recognises -- confirm it is supported or remove it.
        target_layer_range: [0, 23]

merge_method: slerp

parameters:
  # SLERP interpolation coefficient. Entries carrying a `filter` presumably
  # apply only to matching tensors, with the unfiltered entry acting as the
  # fallback -- verify against the consumer's documentation.
  t:
    - filter: self_attn
      value: [0.5]
    - filter: mlp
      value: [0.5]
    - value: 0.5

dtype: float32