PCIResearch committed on
Commit
f07b72c
1 Parent(s): c5ac1fe

Upload 3 files

Browse files

The visual_encoder for TransCore-M.

Files changed (3) hide show
  1. config.json +19 -0
  2. preprocessor_config.json +28 -0
  3. pytorch_model.bin +3 -0
config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/data/lmm_models/clip-vit-large-patch14-336",
3
+ "attention_dropout": 0.0,
4
+ "dropout": 0.0,
5
+ "hidden_act": "quick_gelu",
6
+ "hidden_size": 1024,
7
+ "image_size": 336,
8
+ "initializer_factor": 1.0,
9
+ "initializer_range": 0.02,
10
+ "intermediate_size": 4096,
11
+ "layer_norm_eps": 1e-05,
12
+ "model_type": "clip_vision_model",
13
+ "num_attention_heads": 16,
14
+ "num_channels": 3,
15
+ "num_hidden_layers": 24,
16
+ "patch_size": 14,
17
+ "projection_dim": 768,
18
+ "transformers_version": "4.31.0"
19
+ }
preprocessor_config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": {
3
+ "height": 336,
4
+ "width": 336
5
+ },
6
+ "do_center_crop": true,
7
+ "do_convert_rgb": true,
8
+ "do_normalize": true,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "feature_extractor_type": "CLIPFeatureExtractor",
12
+ "image_mean": [
13
+ 0.48145466,
14
+ 0.4578275,
15
+ 0.40821073
16
+ ],
17
+ "image_processor_type": "CLIPImageProcessor",
18
+ "image_std": [
19
+ 0.26862954,
20
+ 0.26130258,
21
+ 0.27577711
22
+ ],
23
+ "resample": 3,
24
+ "rescale_factor": 0.00392156862745098,
25
+ "size": {
26
+ "shortest_edge": 336
27
+ }
28
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d7c1dbc68ee9bd545517842d8137286e911254d028eb4258daedac303e46c80
3
+ size 607144361