# Deepseek-EVA-32B-SCE-v1 / mergekit_config.yml
# Downtown-Case's picture
# Upload folder using huggingface_hub
# 52946db verified
# raw
# history blame contribute delete
# 440 Bytes
# mergekit configuration: merges the models listed below with the `sce`
# merge method, using Qwen2.5-32B as `base_model`.
# NOTE: every model path is an absolute path on the author's machine;
# adjust the paths before reusing this file elsewhere.
models:
  - model: /home/alpha/Models/Raw/Qwen_Qwen2.5-32B
    # No parameters necessary for base model
  - model: /home/alpha/Models/Raw/nbeerbower_EVA-Gutenberg3-Qwen2.5-32B
  - model: /home/alpha/Models/Raw/deepseek-ai_DeepSeek-R1-Distill-Qwen-32B
merge_method: sce
# `source` must be nested under `tokenizer`; left at column 0 it parses as
# an unrelated top-level key and `tokenizer` becomes null.
tokenizer:
  source: "union"
base_model: /home/alpha/Models/Raw/Qwen_Qwen2.5-32B
chat_template: "deepseek"
# Merge-wide settings must be nested under `parameters` for the same reason.
parameters:
  int8_mask: true
  select_topk: 0.30
dtype: bfloat16