File size: 861 Bytes
5fc9df9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
{
  "_attn_implementation_autoset": true,
  "answer_space": [
    "1",
    "2",
    "3",
    "4",
    "bed",
    "books",
    "cabinet",
    "chair",
    "lamp",
    "paper",
    "photo",
    "picture",
    "pillow",
    "red",
    "sofa",
    "table",
    "white",
    "window"
  ],
  "base_model_name": "blip2",
  "classification_input_dim": 768,
  "dataset_name": "daquar",
  "image_text_hidden_size": 256,
  "image_token_index": null,
  "initializer_factor": 1.0,
  "initializer_range": 0.02,
  "interm_dim": 1024,
  "model_type": "blip-2",
  "multi_class_classifier": true,
  "num_query_tokens": 32,
  "qformer_config": {
    "model_type": "blip_2_qformer"
  },
  "text_config": {
    "model_type": "opt"
  },
  "transformers_version": "4.46.1",
  "use_decoder_only_language_model": true,
  "vision_config": {
    "model_type": "blip_2_vision_model"
  }
}