Transformers
PyTorch
English
bridgetower
Inference Endpoints
shaoyent committed on
Commit
c60f1ee
1 Parent(s): 9088235

Remove image_size

Browse files
Files changed (1) hide show
  1. preprocessor_config.json +49 -51
preprocessor_config.json CHANGED
@@ -1,53 +1,51 @@
1
  {
2
-
3
- "cache_dir":"/tmp",
4
- "downstream_fusion":false,
5
- "downstream_fusion_layers":1,
6
- "downstream_fusion_method":"elmo",
7
- "drop_rate":0.1,
8
- "freeze_RoBERTa":false,
9
- "freeze_ViT":false,
10
- "freeze_layer_count_roberta":false,
11
- "freeze_layer_count_vit":false,
12
- "head_hidden_scale":2,
13
- "hidden_size":768,
14
- "image_size":288,
15
- "input_text_embed_size":768,
16
- "link_tower_shared":false,
17
- "link_tower_type":"add",
18
- "log_dir":"log_dir",
19
- "loss_names":{"contras": 0,
20
- "irtr": 0,
21
- "itm": 0,
22
- "mlm": 0,
23
- "mpp": 0,
24
- "nlvr2": 0,
25
- "snli": 0,
26
- "vcr": 0,
27
- "vcr_qar": 0,
28
- "vqa": 1},
29
- "max_text_len":50,
30
- "mlp_ratio":4,
31
- "model_type":"bridgetower",
32
- "num_heads":12,
33
- "num_layers":6,
34
- "num_nodes":1,
35
- "only_load_cross_modal_from_meter":false,
36
- "patch_size":16,
37
- "resolution_before":224,
38
- "stop_gradient":false,
39
- "task_head_layers":2,
40
- "test_only":false,
41
- "tokenizer":"roberta-base",
42
- "unfreeze_RoBERTa_attention":false,
43
- "unfreeze_RoBERTa_embeddings":false,
44
- "unfreeze_RoBERTa_encoder":false,
45
- "unfreeze_RoBERTa_layernorm":false,
46
- "unfreeze_ViT_attention":false,
47
- "unfreeze_ViT_layernorm":false,
48
- "vit":"ViT-B/16",
49
- "vit_layernorm_init_from_vit":false,
50
- "vit_layernorm_shared":true,
51
- "vit_remove_last":false,
52
- "vocab_size":50265
53
  }
 
1
  {
2
+ "downstream_fusion":false,
3
+ "downstream_fusion_layers":1,
4
+ "downstream_fusion_method":"elmo",
5
+ "drop_rate":0.1,
6
+ "freeze_RoBERTa":false,
7
+ "freeze_ViT":false,
8
+ "freeze_layer_count_roberta":false,
9
+ "freeze_layer_count_vit":false,
10
+ "head_hidden_scale":2,
11
+ "hidden_size":768,
12
+ "input_text_embed_size":768,
13
+ "link_tower_shared":false,
14
+ "link_tower_type":"add",
15
+ "log_dir":"log_dir",
16
+ "loss_names":{"contras": 0,
17
+ "irtr": 0,
18
+ "itm": 0,
19
+ "mlm": 0,
20
+ "mpp": 0,
21
+ "nlvr2": 0,
22
+ "snli": 0,
23
+ "vcr": 0,
24
+ "vcr_qar": 0,
25
+ "vqa": 1},
26
+ "max_text_len":50,
27
+ "mlp_ratio":4,
28
+ "model_type":"bridgetower",
29
+ "num_heads":12,
30
+ "num_layers":6,
31
+ "num_nodes":1,
32
+ "only_load_cross_modal_from_meter":false,
33
+ "patch_size":16,
34
+ "resolution_before":224,
35
+ "stop_gradient":false,
36
+ "size":288,
37
+ "task_head_layers":2,
38
+ "test_only":false,
39
+ "tokenizer":"roberta-base",
40
+ "unfreeze_RoBERTa_attention":false,
41
+ "unfreeze_RoBERTa_embeddings":false,
42
+ "unfreeze_RoBERTa_encoder":false,
43
+ "unfreeze_RoBERTa_layernorm":false,
44
+ "unfreeze_ViT_attention":false,
45
+ "unfreeze_ViT_layernorm":false,
46
+ "vit":"ViT-B/16",
47
+ "vit_layernorm_init_from_vit":false,
48
+ "vit_layernorm_shared":true,
49
+ "vit_remove_last":false,
50
+ "vocab_size":50265
 
 
51
  }