Image-Text-to-Text
OpenCLIP
File size: 794 Bytes
fb81a6b
 
e94397e
fb81a6b
 
e94397e
 
fb81a6b
 
 
 
 
 
 
 
 
e94397e
 
 
fb81a6b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
{
  "model_cfg": {
    "embed_dim": 768,
    "vision_cfg": {
      "image_size": 336,
      "layers": 24,
      "width": 1024,
      "patch_size": 14,
      "no_ln_pre": true,
      "pool_type": "avg",
      "final_ln_after_pool": true
    },
    "text_cfg": {
      "context_length": 128,
      "vocab_size": 32000,
      "vocab_path": "/home/zwang615/code/open_source/Double_Visual_Defense/CLIP_benchmark/clip_benchmark/open_clip/bert_base_vocab_bos_eos.txt",
      "width": 768,
      "heads": 12,
      "layers": 12,
      "pool_type": "last",
      "no_causal_mask": false
    }
  },
  "preprocess_cfg": {
    "mean": [
      0.485,
      0.456,
      0.406
    ],
    "std": [
      0.229,
      0.224,
      0.225
    ],
    "interpolation": "bilinear",
    "resize_mode": "squash"
  }
}