hotmailuser committed on
Commit
25bea3c
·
verified ·
1 Parent(s): 60392df

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -1,14 +1,14 @@
1
  ---
2
  base_model:
3
- - Youlln/ECE-PRYMMAL-0.5B-SLERP-V4
4
- - Youlln/ECE-PRYMMAL-0.5B-SLERP-V3
5
  - Qwen/Qwen2-0.5B-Instruct
6
- - Youlln/ECE-PRYMMAL-0.5B-SLERP-V2
 
7
  library_name: transformers
8
  tags:
9
  - mergekit
10
  - merge
11
- license: apache-2.0
12
  ---
13
  # merge
14
 
@@ -22,9 +22,9 @@ This model was merged using the [Model Stock](https://arxiv.org/abs/2403.19522)
22
  ### Models Merged
23
 
24
  The following models were included in the merge:
25
- * [Youlln/ECE-PRYMMAL-0.5B-SLERP-V4](https://huggingface.co/Youlln/ECE-PRYMMAL-0.5B-SLERP-V4)
26
- * [Youlln/ECE-PRYMMAL-0.5B-SLERP-V3](https://huggingface.co/Youlln/ECE-PRYMMAL-0.5B-SLERP-V3)
27
- * [Youlln/ECE-PRYMMAL-0.5B-SLERP-V2](https://huggingface.co/Youlln/ECE-PRYMMAL-0.5B-SLERP-V2)
28
 
29
  ### Configuration
30
 
@@ -32,13 +32,13 @@ The following YAML configuration was used to produce this model:
32
 
33
  ```yaml
34
  models:
35
- - model: Youlln/ECE-PRYMMAL-0.5B-SLERP-V2
36
- - model: Youlln/ECE-PRYMMAL-0.5B-SLERP-V3
37
- - model: Youlln/ECE-PRYMMAL-0.5B-SLERP-V4
38
  base_model: Qwen/Qwen2-0.5B-Instruct
39
  merge_method: model_stock
40
  parameters:
41
    normalize: true
42
- dtype: bfloat16
43
 
44
- ```
 
1
  ---
2
  base_model:
3
+ - Youlln/ECE-PRYMMAL-0.5B-FT-V4-MUSR
 
4
  - Qwen/Qwen2-0.5B-Instruct
5
+ - Youlln/ECE.EIFFEIL.ia-0.5B-SLERP
6
+ - Youlln/ECE-PRYMMAL-0.5B-FT-V3
7
  library_name: transformers
8
  tags:
9
  - mergekit
10
  - merge
11
+
12
  ---
13
  # merge
14
 
 
22
  ### Models Merged
23
 
24
  The following models were included in the merge:
25
+ * [Youlln/ECE-PRYMMAL-0.5B-FT-V4-MUSR](https://huggingface.co/Youlln/ECE-PRYMMAL-0.5B-FT-V4-MUSR)
26
+ * [Youlln/ECE.EIFFEIL.ia-0.5B-SLERP](https://huggingface.co/Youlln/ECE.EIFFEIL.ia-0.5B-SLERP)
27
+ * [Youlln/ECE-PRYMMAL-0.5B-FT-V3](https://huggingface.co/Youlln/ECE-PRYMMAL-0.5B-FT-V3)
28
 
29
  ### Configuration
30
 
 
32
 
33
  ```yaml
34
  models:
35
+ - model: Youlln/ECE.EIFFEIL.ia-0.5B-SLERP
36
+ - model: Youlln/ECE-PRYMMAL-0.5B-FT-V3
37
+ - model: Youlln/ECE-PRYMMAL-0.5B-FT-V4-MUSR
38
  base_model: Qwen/Qwen2-0.5B-Instruct
39
  merge_method: model_stock
40
  parameters:
41
    normalize: true
42
+ dtype: float16
43
 
44
+ ```
config.json CHANGED
@@ -21,7 +21,7 @@
21
  "rope_theta": 1000000.0,
22
  "sliding_window": null,
23
  "tie_word_embeddings": true,
24
- "torch_dtype": "bfloat16",
25
  "transformers_version": "4.46.2",
26
  "use_cache": true,
27
  "use_sliding_window": false,
 
21
  "rope_theta": 1000000.0,
22
  "sliding_window": null,
23
  "tie_word_embeddings": true,
24
+ "torch_dtype": "float16",
25
  "transformers_version": "4.46.2",
26
  "use_cache": true,
27
  "use_sliding_window": false,
mergekit_config.yml CHANGED
@@ -1,9 +1,9 @@
1
  models:
2
- - model: Youlln/ECE-PRYMMAL-0.5B-SLERP-V2
3
- - model: Youlln/ECE-PRYMMAL-0.5B-SLERP-V3
4
- - model: Youlln/ECE-PRYMMAL-0.5B-SLERP-V4
5
  base_model: Qwen/Qwen2-0.5B-Instruct
6
  merge_method: model_stock
7
  parameters:
8
    normalize: true
9
- dtype: bfloat16
 
1
  models:
2
+ - model: Youlln/ECE.EIFFEIL.ia-0.5B-SLERP
3
+ - model: Youlln/ECE-PRYMMAL-0.5B-FT-V3
4
+ - model: Youlln/ECE-PRYMMAL-0.5B-FT-V4-MUSR
5
  base_model: Qwen/Qwen2-0.5B-Instruct
6
  merge_method: model_stock
7
  parameters:
8
    normalize: true
9
+ dtype: float16
model-00001-of-00001.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11c2f69d6e174917fceab134dfd5e56ddabc1374b252a9f8ddcfefee9f13625f
3
- size 1260367448
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c0fdc4873a96700bd691d9824cdd3f965a3cbfe64ef63b1e1a4fe51d2eabdef
3
+ size 1260367152