VictorSanh committed on
Commit
aec559d
1 Parent(s): 682a420

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +17 -13
config.json CHANGED
@@ -5,7 +5,7 @@
5
  "alpha_type": "float",
6
  "alphas_initializer_range": 0.0,
7
  "architectures": [
8
- "IdeficsForCausalLM"
9
  ],
10
  "bos_token_id": 1,
11
  "cross_layer_activation_function": "swiglu",
@@ -28,22 +28,26 @@
28
  "num_hidden_layers": 32,
29
  "pad_token_id": 0,
30
  "qk_layer_norms": true,
31
- "qk_layer_norms_perceiver": true,
32
- "resampler_depth": 6,
33
- "resampler_head_dim": 96,
34
- "resampler_n_heads": 16,
35
- "resampler_n_latents": 64,
36
  "rms_norm_eps": 1e-06,
37
  "tie_word_embeddings": false,
38
  "torch_dtype": "bfloat16",
39
  "transformers_version": "4.28.0.dev0",
40
  "use_cache": true,
41
  "use_resampler": true,
42
- "vision_embed_dim": 1280,
43
- "vision_image_size": 224,
44
- "vision_intermediate_size": 5120,
45
- "vision_patch_size": 14,
46
- "vision_num_attention_heads": 16,
47
- "vision_num_hidden_layers": 32,
48
- "vocab_size": 32000
 
 
 
 
 
 
 
 
 
49
  }
 
5
  "alpha_type": "float",
6
  "alphas_initializer_range": 0.0,
7
  "architectures": [
8
+ "IdeficsForVisionText2Text"
9
  ],
10
  "bos_token_id": 1,
11
  "cross_layer_activation_function": "swiglu",
 
28
  "num_hidden_layers": 32,
29
  "pad_token_id": 0,
30
  "qk_layer_norms": true,
 
 
 
 
 
31
  "rms_norm_eps": 1e-06,
32
  "tie_word_embeddings": false,
33
  "torch_dtype": "bfloat16",
34
  "transformers_version": "4.28.0.dev0",
35
  "use_cache": true,
36
  "use_resampler": true,
37
+ "vocab_size": 32000,
38
+ "vision_config": {
39
+ "embed_dim": 1280,
40
+ "image_size": 224,
41
+ "intermediate_size": 5120,
42
+ "patch_size": 14,
43
+ "num_attention_heads": 16,
44
+ "num_hidden_layers": 32
45
+ },
46
+ "perceiver_config": {
47
+ "qk_layer_norms_perceiver": true,
48
+ "resampler_depth": 6,
49
+ "resampler_head_dim": 96,
50
+ "resampler_n_heads": 16,
51
+ "resampler_n_latents": 64
52
+ }
53
  }