Update README.md
Browse files
README.md
CHANGED
@@ -11,7 +11,7 @@ tags:
|
|
11 |
- merge
|
12 |
|
13 |
---
|
14 |
-
#
|
15 |
|
16 |
This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
|
17 |
|
@@ -35,20 +35,15 @@ The following YAML configuration was used to produce this model:
|
|
35 |
```yaml
|
36 |
models:
|
37 |
# Pivot model
|
38 |
-
|
39 |
# Target models
|
40 |
- model: Qwen/Qwen2.5-14B-Instruct
|
41 |
- model: deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
|
42 |
- model: arcee-ai/Virtuoso-Small-v2
|
43 |
-
- model: arcee-ai/SuperNova-Medius
|
44 |
- model: Krystalan/DRT-o1-14B
|
45 |
merge_method: sce
|
46 |
base_model: arcee-ai/SuperNova-Medius
|
47 |
-
# Qwen/Qwen2.5-14B
|
48 |
tokenizer_source: base
|
49 |
-
# arcee-ai/Virtuoso-Small-v2
|
50 |
-
# Qwen/Qwen2.5-14B
|
51 |
-
# deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
|
52 |
parameters:
|
53 |
select_topk: 1.0
|
54 |
dtype: bfloat16
|
|
|
11 |
- merge
|
12 |
|
13 |
---
|
14 |
+
# CoderO1-14B-Preview
|
15 |
|
16 |
This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
|
17 |
|
|
|
35 |
```yaml
|
36 |
models:
|
37 |
# Pivot model
|
38 |
+
- model: arcee-ai/SuperNova-Medius
|
39 |
# Target models
|
40 |
- model: Qwen/Qwen2.5-14B-Instruct
|
41 |
- model: deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
|
42 |
- model: arcee-ai/Virtuoso-Small-v2
|
|
|
43 |
- model: Krystalan/DRT-o1-14B
|
44 |
merge_method: sce
|
45 |
base_model: arcee-ai/SuperNova-Medius
|
|
|
46 |
tokenizer_source: base
|
|
|
|
|
|
|
47 |
parameters:
|
48 |
select_topk: 1.0
|
49 |
dtype: bfloat16
|