---
# Model-merge configuration: combines the two checkpoints listed under
# `models` using the `linear` merge method.
# NOTE(review): the schema (models / merge_method / dtype) looks like a
# mergekit config -- confirm against the tool that consumes this file.

models:
  # First source model, referenced by a hub-style "org/name" identifier.
  - model: Qwen/Qwen2.5-Math-1.5B-Instruct
    parameters:
      weight: 0.4
  # Second source model, referenced by a relative filesystem path.
  # NOTE(review): presumably resolved against the working directory the
  # merge tool is launched from, not this file's location -- verify.
  - model: ../../skywork-o1-prm-inference/new_model_path
    parameters:
      weight: 0.6

# The two weights above sum to 1.0.
# NOTE(review): whether the tool re-normalizes weights is not visible
# here -- check the merge-method documentation before changing them.
merge_method: linear

# Data type named for the merge.
# NOTE(review): presumably the precision of the output tensors -- confirm.
dtype: float16