可亲 committed on
Commit
688e28d
1 Parent(s): 0cb5bb4

fix(pad zero): zero-pad intermediate_size from 29568 to 29696 so that the quantized model can run with 8-way tensor parallelism in vLLM

Browse files
.gitattributes ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -1,20 +1,16 @@
1
  {
2
- "_name_or_path": "Qwen/Qwen2-VL-72B-Instruct-AWQ",
3
  "architectures": [
4
  "Qwen2VLForConditionalGeneration"
5
  ],
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 151643,
8
  "eos_token_id": 151645,
9
- "vision_start_token_id": 151652,
10
- "vision_end_token_id": 151653,
11
- "vision_token_id": 151654,
12
- "image_token_id": 151655,
13
- "video_token_id": 151656,
14
  "hidden_act": "silu",
15
  "hidden_size": 8192,
 
16
  "initializer_range": 0.02,
17
- "intermediate_size": 29568,
18
  "max_position_embeddings": 32768,
19
  "max_window_layers": 80,
20
  "model_type": "qwen2_vl",
@@ -47,17 +43,15 @@
47
  "transformers_version": "4.45.0.dev0",
48
  "use_cache": true,
49
  "use_sliding_window": false,
 
50
  "vision_config": {
51
- "depth": 32,
52
- "embed_dim": 1280,
53
- "mlp_ratio": 4,
54
- "num_heads": 16,
55
- "in_chans": 3,
56
  "hidden_size": 8192,
57
- "patch_size": 14,
58
- "spatial_merge_size": 2,
59
- "spatial_patch_size": 14,
60
- "temporal_patch_size": 2
61
  },
 
 
 
62
  "vocab_size": 152064
63
  }
 
1
  {
2
+ "_name_or_path": "Qwen/Qwen2-VL-72B-Instruct-315-fix-dim-pad",
3
  "architectures": [
4
  "Qwen2VLForConditionalGeneration"
5
  ],
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 151643,
8
  "eos_token_id": 151645,
 
 
 
 
 
9
  "hidden_act": "silu",
10
  "hidden_size": 8192,
11
+ "image_token_id": 151655,
12
  "initializer_range": 0.02,
13
+ "intermediate_size": 29696,
14
  "max_position_embeddings": 32768,
15
  "max_window_layers": 80,
16
  "model_type": "qwen2_vl",
 
43
  "transformers_version": "4.45.0.dev0",
44
  "use_cache": true,
45
  "use_sliding_window": false,
46
+ "video_token_id": 151656,
47
  "vision_config": {
 
 
 
 
 
48
  "hidden_size": 8192,
49
+ "in_chans": 3,
50
+ "model_type": "qwen2_vl",
51
+ "spatial_patch_size": 14
 
52
  },
53
+ "vision_end_token_id": 151653,
54
+ "vision_start_token_id": 151652,
55
+ "vision_token_id": 151654,
56
  "vocab_size": 152064
57
  }
generation_config.json CHANGED
@@ -1,13 +1,11 @@
1
  {
2
- "bos_token_id": 151643,
3
- "pad_token_id": 151643,
4
  "do_sample": true,
5
- "eos_token_id": [
6
- 151645,
7
- 151643
8
- ],
9
- "repetition_penalty": 1.05,
10
- "top_p": 0.001,
11
- "top_k": 1,
12
  "transformers_version": "4.45.0.dev0"
13
  }
 
1
  {
2
+ "chat_format": "chatml",
 
3
  "do_sample": true,
4
+ "eos_token_id": 151643,
5
+ "max_new_tokens": 512,
6
+ "max_window_size": 6144,
7
+ "pad_token_id": 151643,
8
+ "top_k": 0,
9
+ "top_p": 0.01,
 
10
  "transformers_version": "4.45.0.dev0"
11
  }
model-00001-of-00011.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb053403e32f0f170f1cf34c593f32c6277cb8c128dca6d13d96b0a5e5488d05
3
- size 3968639512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdacf90b517828c5ff867ea246182475ef74bdc71e1f94bccb363a8e84163b93
3
+ size 1221591040
model-00002-of-00011.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:833322e4ad4577970c2780fc680c1032fbe111377e50fd3282a74b1f18ec26fb
3
- size 3899899496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae13b4b0707ae2d71a2dc438ce31ab561edd772990e874bf7d3a65a007c23f8c
3
+ size 3914063464
model-00003-of-00011.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d4abd7986db5540fa8983232efd26ef51b7cf2ecbe2517b2171902dc07a0aade
3
- size 3978401464
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fcf53da5c2ff57ea36d9267025b50cf1567d3a6e2cab30361118078d494e910
3
+ size 3992565432
model-00004-of-00011.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe2cba911774e1791578d3243d35a1288106ccface9cc1d742ba5a62d766811c
3
- size 3978401504
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f8e5d6ebd7faf0358ffd638d3ad82ac69a4da852d7677aa2b1ba3ef8d4436d2
3
+ size 3992565472
model-00005-of-00011.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d95c1e33983b475b72e1273900f63a4a9fd50fc004f650cd424e2c21256e616b
3
- size 3899899712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc264ea4aedcd0699307e1e66981edb6c5a3fdb06e7d4e193b0a01590b351878
3
+ size 3914063680
model-00006-of-00011.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab50438ebcb0cd8f49bbfa6e7451a7e2663b683858488a122b485c0d93fc0579
3
- size 3978401504
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99aa915bcd142038bb0369663c8af65a5870a37cc198ad0b6e87786a4cec0c46
3
+ size 3992565472
model-00007-of-00011.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e07762ad5a708f1d997eb9eb4a345ae8c4e587448f7585f5c9da4c9d82f0cfe
3
- size 3978401504
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d02e7c1fa0a6aca98eb643a2df2c6b483d108dad5e9b7c9b5fd2bdbdc2a5db6
3
+ size 3992565472
model-00008-of-00011.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7482977415c7e31d41f103c8f71a4f34dd2abeb49913d533d27ad3d708b52e35
3
- size 3899899712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd4076e8117ce301d7488c2707cc5dea92e726956fd4060b38087d293405b030
3
+ size 3914063680
model-00009-of-00011.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a701214ea01fb1a5b3f6ebf13be0afa140b8b74a79b9c4da5efb3e8d0f80ac64
3
- size 3978401504
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d0a5d19007565c00522f63e98b7fdcf8e81b8775eedecfeccd1a6161d2aa45f
3
+ size 3992565472
model-00010-of-00011.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52d156b63833d447c6022c3b6ef7b36e7295228ccf348c26b640d3d8ada95476
3
- size 3978401504
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfcd19e2a82637baeb21a811b49824ccc1bc657f04e57c1161d3c6eacd1b36f8
3
+ size 3992565472
model-00011-of-00011.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f68308b31bda9a52853a75565f701676c5869be3ce8dc64d9c5e8dc46a783b91
3
- size 3325018408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24b421ae6c69eef5024b72024cbe743bcc3546b99a068ff5bf1828cbf1f3dd5a
3
+ size 3328287016
model.safetensors.index.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "metadata": {
3
- "total_size": 42863488000
4
  },
5
  "weight_map": {
6
  "visual.patch_embed.proj.weight": "model-00001-of-00011.safetensors",
 
1
  {
2
  "metadata": {
3
+ "total_size": 42994232320
4
  },
5
  "weight_map": {
6
  "visual.patch_embed.proj.weight": "model-00001-of-00011.safetensors",