usernameisanna committed on
Commit
70694b8
·
verified ·
1 Parent(s): 7e32e1b

Upload Blip2ForConditionalGeneration

Browse files
config.json CHANGED
@@ -1,23 +1,86 @@
1
  {
 
2
  "architectures": [
3
- "DeiTModel"
4
  ],
5
- "attention_head_size": 88,
6
- "attention_probs_dropout_prob": 0.0,
7
- "encoder_stride": 14,
8
- "hidden_act": "gelu",
9
- "hidden_dropout_prob": 0.0,
10
- "hidden_size": 1408,
11
- "image_size": 224,
12
  "initializer_range": 0.02,
13
- "intermediate_size": 3072,
14
- "layer_norm_eps": 1e-12,
15
- "model_type": "deit",
16
- "num_attention_heads": 16,
17
- "num_channels": 3,
18
- "num_hidden_layers": 12,
19
- "patch_size": 16,
20
- "qkv_bias": true,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
21
  "torch_dtype": "float32",
22
- "transformers_version": "4.39.0.dev0"
 
 
 
 
 
 
 
 
23
  }
 
1
  {
2
+ "_name_or_path": "Salesforce/blip2-flan-t5-xl",
3
  "architectures": [
4
+ "Blip2ForConditionalGeneration"
5
  ],
6
+ "initializer_factor": 1.0,
 
 
 
 
 
 
7
  "initializer_range": 0.02,
8
+ "is_encoder_decoder": true,
9
+ "model_type": "blip-2",
10
+ "num_query_tokens": 32,
11
+ "qformer_config": {
12
+ "classifier_dropout": null,
13
+ "model_type": "blip_2_qformer"
14
+ },
15
+ "text_config": {
16
+ "architectures": [
17
+ "T5ForConditionalGeneration"
18
+ ],
19
+ "bos_token_id": 1,
20
+ "classifier_dropout": 0.0,
21
+ "d_ff": 5120,
22
+ "d_kv": 64,
23
+ "d_model": 2048,
24
+ "decoder_start_token_id": 0,
25
+ "dense_act_fn": "gelu",
26
+ "dropout_rate": 0.1,
27
+ "eos_token_id": 1,
28
+ "feed_forward_proj": "gated-gelu",
29
+ "initializer_factor": 1.0,
30
+ "is_encoder_decoder": true,
31
+ "is_gated_act": true,
32
+ "layer_norm_epsilon": 1e-06,
33
+ "model_type": "t5",
34
+ "n_positions": 512,
35
+ "num_decoder_layers": 24,
36
+ "num_heads": 32,
37
+ "num_layers": 24,
38
+ "output_past": true,
39
+ "pad_token_id": 0,
40
+ "relative_attention_max_distance": 128,
41
+ "relative_attention_num_buckets": 32,
42
+ "task_specific_params": {
43
+ "summarization": {
44
+ "early_stopping": true,
45
+ "length_penalty": 2.0,
46
+ "max_length": 200,
47
+ "min_length": 30,
48
+ "no_repeat_ngram_size": 3,
49
+ "num_beams": 4,
50
+ "prefix": "summarize: "
51
+ },
52
+ "translation_en_to_de": {
53
+ "early_stopping": true,
54
+ "max_length": 300,
55
+ "num_beams": 4,
56
+ "prefix": "translate English to German: "
57
+ },
58
+ "translation_en_to_fr": {
59
+ "early_stopping": true,
60
+ "max_length": 300,
61
+ "num_beams": 4,
62
+ "prefix": "translate English to French: "
63
+ },
64
+ "translation_en_to_ro": {
65
+ "early_stopping": true,
66
+ "max_length": 300,
67
+ "num_beams": 4,
68
+ "prefix": "translate English to Romanian: "
69
+ }
70
+ },
71
+ "tie_word_embeddings": false,
72
+ "torch_dtype": "float32",
73
+ "vocab_size": 32128
74
+ },
75
+ "tie_word_embeddings": false,
76
  "torch_dtype": "float32",
77
+ "transformers_version": "4.39.0.dev0",
78
+ "use_decoder_only_language_model": false,
79
+ "vision_config": {
80
+ "dropout": 0.0,
81
+ "initializer_factor": 1.0,
82
+ "model_type": "blip_2_vision_model",
83
+ "num_channels": 3,
84
+ "projection_dim": 512
85
+ }
86
  }
generation_config.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "decoder_start_token_id": 0,
5
+ "eos_token_id": 1,
6
+ "pad_token_id": 0,
7
+ "transformers_version": "4.39.0.dev0"
8
+ }
model-00001-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36db2b49ed99e83be1519949ad0a9d2702a24defb7670bb5bcb339099c655112
3
+ size 4990211672
model-00002-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e04e1abba46af55207c1bcf115290591c290c70c1a4a4cc179b0ccbe8e16187
3
+ size 4958174576
model-00003-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e47bacac4a5ca7b7659fe15dbaf6f428d970bf06c123e83c5f6610c2be7c73c1
3
+ size 2687755952
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff