thdangtr committed on
Commit
c6ffafc
1 Parent(s): 6e82ba2
Files changed (2) hide show
  1. config.json +8 -3
  2. model.safetensors +2 -2
config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "_name_or_path": "Salesforce/blip-vqa-capfilt-large",
3
  "architectures": [
4
- "BlipForQuestionAnswering"
5
  ],
6
  "image_text_hidden_size": 256,
7
  "initializer_factor": 1.0,
@@ -11,6 +11,7 @@
11
  "model_type": "blip",
12
  "projection_dim": 512,
13
  "text_config": {
 
14
  "initializer_factor": 1.0,
15
  "model_type": "blip_text_model",
16
  "num_attention_heads": 12
@@ -19,9 +20,13 @@
19
  "transformers_version": "4.39.3",
20
  "vision_config": {
21
  "dropout": 0.0,
 
22
  "initializer_factor": 1.0,
23
  "initializer_range": 0.02,
 
24
  "model_type": "blip_vision_model",
25
- "num_channels": 3
 
 
26
  }
27
  }
 
1
  {
2
+ "_name_or_path": "Salesforce/blip-image-captioning-large",
3
  "architectures": [
4
+ "BlipForConditionalGeneration"
5
  ],
6
  "image_text_hidden_size": 256,
7
  "initializer_factor": 1.0,
 
11
  "model_type": "blip",
12
  "projection_dim": 512,
13
  "text_config": {
14
+ "encoder_hidden_size": 1024,
15
  "initializer_factor": 1.0,
16
  "model_type": "blip_text_model",
17
  "num_attention_heads": 12
 
20
  "transformers_version": "4.39.3",
21
  "vision_config": {
22
  "dropout": 0.0,
23
+ "hidden_size": 1024,
24
  "initializer_factor": 1.0,
25
  "initializer_range": 0.02,
26
+ "intermediate_size": 4096,
27
  "model_type": "blip_vision_model",
28
+ "num_attention_heads": 16,
29
+ "num_channels": 3,
30
+ "num_hidden_layers": 24
31
  }
32
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e0bcd3494b46756684ddc3c9286ed9c32717ad4d37e9c1d62869add2110e829
3
- size 1538792184
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86bdefcfb2181f13b351e486bc6508804c8dfd5dce98ec9d0e2efffff325c192
3
+ size 1879010480