apepkuss79 committed on
Commit
8736848
1 Parent(s): 86582f2

Update models

Browse files
.gitattributes CHANGED
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ Qwen2.5-0.5B-Instruct-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
37
+ Qwen2.5-0.5B-Instruct-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
38
+ Qwen2.5-0.5B-Instruct-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
39
+ Qwen2.5-0.5B-Instruct-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
40
+ Qwen2.5-0.5B-Instruct-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
41
+ Qwen2.5-0.5B-Instruct-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
42
+ Qwen2.5-0.5B-Instruct-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
43
+ Qwen2.5-0.5B-Instruct-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
44
+ Qwen2.5-0.5B-Instruct-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
45
+ Qwen2.5-0.5B-Instruct-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
46
+ Qwen2.5-0.5B-Instruct-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
47
+ Qwen2.5-0.5B-Instruct-f16.gguf filter=lfs diff=lfs merge=lfs -text
Qwen2.5-0.5B-Instruct-Q2_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a744b4beab939d899e22c8a070b7041a275582fb942483c9436d455173c7e23d
3
+ size 338607424
Qwen2.5-0.5B-Instruct-Q3_K_L.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3aa94cfe9e51e3ec01a2bbdb2828dd64716a8e7751ec9cb16bd99151c8261651
3
+ size 369358144
Qwen2.5-0.5B-Instruct-Q3_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5abe04c0c7ab2eb6313d2a3a669e0d2e27971630b3d2dc0183b0e64f01597d79
3
+ size 355466560
Qwen2.5-0.5B-Instruct-Q3_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b5845bdfe86402b6fe7154e1436941c58167a667a7fb476adf5bd8112a8c4f6
3
+ size 338263360
Qwen2.5-0.5B-Instruct-Q4_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:242af9ee5029ac7261f3b0e50cf0c81a43a906fa48546a40a09c7e2f28f0ce16
3
+ size 352154944
Qwen2.5-0.5B-Instruct-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9c0d231b0254800f96cc58be8818ea5df96dbcf77c6f67f76b130267a4c35f2
3
+ size 397807936
Qwen2.5-0.5B-Instruct-Q4_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:accd05ae3f684ecba9ba373b752d9c79759272d6bb4567bb81597b8886aac016
3
+ size 385471808
Qwen2.5-0.5B-Instruct-Q5_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fedd9a813195cd3fe5eaec701532bae0cadb0ae2971aaecff12fb0c60798e7c
3
+ size 396883264
Qwen2.5-0.5B-Instruct-Q5_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3770ca0aa82dfcfbb7747713f88237be7867829afe7621a9fb117a28efeacfb6
3
+ size 412710208
Qwen2.5-0.5B-Instruct-Q6_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:526ade7343ce34f493ff03c6231e82d78f1eab59284541c3530fc4285911d641
3
+ size 505736512
Qwen2.5-0.5B-Instruct-Q8_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4829649671bf775152642cfbbe771ef8b87a68a94e31a8e8995e1c6e5167edb2
3
+ size 531068224
Qwen2.5-0.5B-Instruct-f16.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f96e01a3f550ca08aea1e5725bb8d5a7eccc6f281c30417e9d380b8c46467bd
3
+ size 994156864
config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Qwen2ForCausalLM"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 151643,
7
+ "eos_token_id": 151645,
8
+ "hidden_act": "silu",
9
+ "hidden_size": 896,
10
+ "initializer_range": 0.02,
11
+ "intermediate_size": 4864,
12
+ "max_position_embeddings": 32768,
13
+ "max_window_layers": 21,
14
+ "model_type": "qwen2",
15
+ "num_attention_heads": 14,
16
+ "num_hidden_layers": 24,
17
+ "num_key_value_heads": 2,
18
+ "rms_norm_eps": 1e-06,
19
+ "rope_theta": 1000000.0,
20
+ "sliding_window": 32768,
21
+ "tie_word_embeddings": true,
22
+ "torch_dtype": "bfloat16",
23
+ "transformers_version": "4.43.1",
24
+ "use_cache": true,
25
+ "use_sliding_window": false,
26
+ "vocab_size": 151936
27
+ }