Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +61 -0
- generation_config.json +10 -0
- latest +1 -0
- model-00001-of-00006.safetensors +3 -0
- model-00002-of-00006.safetensors +3 -0
- model-00003-of-00006.safetensors +3 -0
- model-00004-of-00006.safetensors +3 -0
- model-00005-of-00006.safetensors +3 -0
- model-00006-of-00006.safetensors +3 -0
- model.safetensors.index.json +0 -0
- rng_state_0.pth +3 -0
- rng_state_1.pth +3 -0
- rng_state_10.pth +3 -0
- rng_state_100.pth +3 -0
- rng_state_101.pth +3 -0
- rng_state_102.pth +3 -0
- rng_state_103.pth +3 -0
- rng_state_104.pth +3 -0
- rng_state_105.pth +3 -0
- rng_state_106.pth +3 -0
- rng_state_107.pth +3 -0
- rng_state_108.pth +3 -0
- rng_state_109.pth +3 -0
- rng_state_11.pth +3 -0
- rng_state_110.pth +3 -0
- rng_state_111.pth +3 -0
- rng_state_112.pth +3 -0
- rng_state_113.pth +3 -0
- rng_state_114.pth +3 -0
- rng_state_115.pth +3 -0
- rng_state_116.pth +3 -0
- rng_state_117.pth +3 -0
- rng_state_118.pth +3 -0
- rng_state_119.pth +3 -0
- rng_state_12.pth +3 -0
- rng_state_120.pth +3 -0
- rng_state_121.pth +3 -0
- rng_state_122.pth +3 -0
- rng_state_123.pth +3 -0
- rng_state_124.pth +3 -0
- rng_state_125.pth +3 -0
- rng_state_126.pth +3 -0
- rng_state_127.pth +3 -0
- rng_state_13.pth +3 -0
- rng_state_14.pth +3 -0
- rng_state_15.pth +3 -0
- rng_state_16.pth +3 -0
- rng_state_17.pth +3 -0
- rng_state_18.pth +3 -0
- rng_state_19.pth +3 -0
config.json
ADDED
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/fsx-project/xichenpan/PISCES/clip-evaclip-und-gen-pretrain-long-caption-70M/checkpoint-76000",
|
3 |
+
"architectures": [
|
4 |
+
"LlavaLlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": [
|
10 |
+
128001,
|
11 |
+
128008,
|
12 |
+
128009
|
13 |
+
],
|
14 |
+
"freeze_mm_mlp_adapter": false,
|
15 |
+
"gen_hidden_size": 1792,
|
16 |
+
"gen_pooling": "early_pool2d_4",
|
17 |
+
"gen_projector_type": "mlp2x_gelu",
|
18 |
+
"gen_vision_tower": "eva-clip-E-14-plus",
|
19 |
+
"hidden_act": "silu",
|
20 |
+
"hidden_size": 4096,
|
21 |
+
"image_aspect_ratio": "square",
|
22 |
+
"initializer_range": 0.02,
|
23 |
+
"intermediate_size": 14336,
|
24 |
+
"max_position_embeddings": 131072,
|
25 |
+
"mlp_bias": false,
|
26 |
+
"mm_hidden_size": 1152,
|
27 |
+
"mm_patch_merge_type": "flat",
|
28 |
+
"mm_projector_lr": null,
|
29 |
+
"mm_projector_type": "mlp2x_gelu",
|
30 |
+
"mm_use_im_patch_token": false,
|
31 |
+
"mm_use_im_start_end": false,
|
32 |
+
"mm_vision_select_feature": "patch",
|
33 |
+
"mm_vision_select_layer": -2,
|
34 |
+
"mm_vision_tower": "google/siglip-so400m-patch14-384",
|
35 |
+
"model_type": "llava_llama",
|
36 |
+
"n_query": 64,
|
37 |
+
"num_attention_heads": 32,
|
38 |
+
"num_hidden_layers": 32,
|
39 |
+
"num_key_value_heads": 8,
|
40 |
+
"pad_token_id": 128256,
|
41 |
+
"pretraining_tp": 1,
|
42 |
+
"rms_norm_eps": 1e-05,
|
43 |
+
"rope_scaling": {
|
44 |
+
"factor": 8.0,
|
45 |
+
"high_freq_factor": 4.0,
|
46 |
+
"low_freq_factor": 1.0,
|
47 |
+
"original_max_position_embeddings": 8192,
|
48 |
+
"rope_type": "llama3"
|
49 |
+
},
|
50 |
+
"rope_theta": 500000.0,
|
51 |
+
"tie_word_embeddings": false,
|
52 |
+
"tokenizer_model_max_length": 2048,
|
53 |
+
"tokenizer_padding_side": "right",
|
54 |
+
"torch_dtype": "bfloat16",
|
55 |
+
"transformers_version": "4.43.1",
|
56 |
+
"tune_mm_mlp_adapter": false,
|
57 |
+
"use_cache": false,
|
58 |
+
"use_mm_proj": true,
|
59 |
+
"vision_tower_pretrained": null,
|
60 |
+
"vocab_size": 128260
|
61 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 128000,
|
4 |
+
"eos_token_id": [
|
5 |
+
128001,
|
6 |
+
128008,
|
7 |
+
128009
|
8 |
+
],
|
9 |
+
"transformers_version": "4.43.1"
|
10 |
+
}
|
latest
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
global_step2181
|
model-00001-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a9e2b32bde579a8af7aa7ff334268054e1973e7e4784b784dce00fbdd73fa71
|
3 |
+
size 4976731440
|
model-00002-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ad337522f3b09f325ab9fa27dcacd88b401d49a7d53081a6ae71315c246968b
|
3 |
+
size 4999802720
|
model-00003-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:112610dd4b087f759db44b30cbc1baa4e3791e35ec621b3566566bad3c201226
|
3 |
+
size 4915916176
|
model-00004-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa36cad7493429e5ed64ca475012125b2dcebfa360e712da4ec47217f6d469ff
|
3 |
+
size 4999640736
|
model-00005-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd670041a4feb23fe022e820d9e39a02c4ce418b7e0da8d74642f2a216b8e0e2
|
3 |
+
size 4783899064
|
model-00006-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:379519f4028e2de1353ea12c737a8bb43235f2dbe3323d290c919893e496c452
|
3 |
+
size 1050706048
|
model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08282b46825aa78d10fe10e3fea89555c5b5a691b261a3ddfd58fcb58370edff
|
3 |
+
size 15984
|
rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbab71d98a3a9a92df82a6bba463947327c3a1bcf35cd9f4f46114641fc42dd9
|
3 |
+
size 15984
|
rng_state_10.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54e5c2d65c14df39137f6a3bd8314f534dad93d72efe8e40e23a61187ba74ce8
|
3 |
+
size 15997
|
rng_state_100.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3348f3273bba5031460ff72f828dea6495a28aefdcd45b867b6b13f07d894486
|
3 |
+
size 16010
|
rng_state_101.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c1a8f1f76d6695d77ae3f0409b5f706823dea2abd1e9c1e6a087172edef142b
|
3 |
+
size 16010
|
rng_state_102.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0788302ee891c711bd0de0decb3473a7c782ddcc1a4b27ba03a807970f328c04
|
3 |
+
size 16010
|
rng_state_103.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b28e67cc65c3e4f4f358aa401694fa7730976852b3e13b80091f85f64b7a6eb
|
3 |
+
size 16010
|
rng_state_104.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f16ea3fa6dca9cfedace2ce355a83089017d457314a1e9663bb27ee6baa3a54f
|
3 |
+
size 16010
|
rng_state_105.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25f8a4db0b06b5a4a4b3532311df15bd80ffb0cc8acc6e501e2a40750c6a110b
|
3 |
+
size 16010
|
rng_state_106.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfd82150caf6137522184645dfed99e9cb655f60664fe5acc2a2d47138674b24
|
3 |
+
size 16010
|
rng_state_107.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4b09e28acb0dcb65ae126cec7c010223226ceb3c696ebbdec7e3ead29eae357
|
3 |
+
size 16010
|
rng_state_108.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e06c8d01f5ff1cd85a48f6cdbfb3d1e361ac210a6d9ca8d05340fa6e27f2ee2
|
3 |
+
size 16010
|
rng_state_109.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f23768cabf8f0cbb22f051c8a6a8d0ad5c6cde80042119e0ce0551ab3643a38
|
3 |
+
size 16010
|
rng_state_11.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f578146bcaaed333cf4637aa3b454e2f6238e691e45b4160001b63b4f8b5ce4e
|
3 |
+
size 15997
|
rng_state_110.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d5872ce3bb6df4d00c5ef40ee7f5f8c4883ac9a78593dab828fbde6a9de7406
|
3 |
+
size 16010
|
rng_state_111.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83457e579f37b67caf78db123682a095631fae347086152e842de889f9361cf6
|
3 |
+
size 16010
|
rng_state_112.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4ead6f9d6c9ceb5a3ae07bfc3c3a7c92bde5b2f84c3f8160ebc7d9fea3a2a28
|
3 |
+
size 16010
|
rng_state_113.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9952b458df627d851633776836c9967df761e1431dc86626dd012482676e80a4
|
3 |
+
size 16010
|
rng_state_114.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b22ba28409b8d67f28808836de79aef45571f4229e16801c1b807ff6a9263fba
|
3 |
+
size 16010
|
rng_state_115.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:074579558cac067c2f5af51b47d9011e8be1f7603fe8f6eeb908d89a61092b1c
|
3 |
+
size 16010
|
rng_state_116.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97d0f43669be568d9d0d4ce3f2bd7735f7b5a22d1fbf8fabfbbb5a71451d6fa8
|
3 |
+
size 16010
|
rng_state_117.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5086a5b6e47114ffba841e4ab1a7c85050706e578a24bffc0d494b47bccb0521
|
3 |
+
size 16010
|
rng_state_118.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc3fc5a47bab9cbee554ced02fb28e785c754412c70420f15af7649706fefb9e
|
3 |
+
size 16010
|
rng_state_119.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c82830fa5ad835ef57e7307501cae3e1394b32f672acceb5d40d800d19785a4c
|
3 |
+
size 16010
|
rng_state_12.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8463662162a837871bb50af43a407175ca95f3f364bc13c7d065e8b6929bad11
|
3 |
+
size 15997
|
rng_state_120.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e31fe7640ea11e1d797ada7476f7bdc37d6064763d107f4c679cfa402366b6c
|
3 |
+
size 16010
|
rng_state_121.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d2823072ec92703cf2e175896c8da4393d3cc28e4b18c866d48ba728c92d429
|
3 |
+
size 16010
|
rng_state_122.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6e9b024d5ca860c40ece9a131f8ea4a44e31b793fce79a070be11fb9079bd23
|
3 |
+
size 16010
|
rng_state_123.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59008bff551b6589638f02ce6d8cb020b65015af673a55372988767751117b17
|
3 |
+
size 16010
|
rng_state_124.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:690cadbcf664e76a148a493b336f3453607353be0c3116f0a00b9489516a2938
|
3 |
+
size 16010
|
rng_state_125.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c45e8b7a958fe440baf7992d7b08940c80386f552e1100a2a3810ce4a9d4d01
|
3 |
+
size 16010
|
rng_state_126.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d2f8dec72b4197cd7507923ea29c9d82731ec410be50aa83306fe3272146049
|
3 |
+
size 16010
|
rng_state_127.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d84dc9619c55b5d3d908b2a1ba9eced39badbd9b59272791bd06cd7e22db3e71
|
3 |
+
size 16010
|
rng_state_13.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe9bafd75244b907f13aa5b102963f4d018d7b80b94ddb0262313774362d9305
|
3 |
+
size 15997
|
rng_state_14.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5e353c1ca54c464e3464d695507da7da6c134e4ad9d6acab6f72e52d5bf13c7
|
3 |
+
size 15997
|
rng_state_15.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24f1ef20cfc904ac8f811ceffab91f00cccadca0e878c8ef8a7335e83ef9513f
|
3 |
+
size 15997
|
rng_state_16.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cecf995eb1b13a85a673384ed67c75acc989e9d373ac7da2d90cbc7af2c1b4a7
|
3 |
+
size 15997
|
rng_state_17.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:375986c2a348f319aeed3322fcf23be7787f801c585046ff217d7855463fbc0d
|
3 |
+
size 15997
|
rng_state_18.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a50dfdcb902d78e55850cabc410552a4e651090792c2e086926cbda383b4f35f
|
3 |
+
size 15997
|
rng_state_19.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79850d41cfed8d83ef96222b2b956a0ec273b7fa78630d3cb0e86f2ab29bb934
|
3 |
+
size 15997
|