Jiayi-Pan commited on
Commit
b9ad3dc
1 Parent(s): 15e583c

090703911a95d53d3d23274aa821eafdd599b3aff0ab3dddc19850346ddd11f8

Browse files
Files changed (1) hide show
  1. model_config.json +82 -0
model_config.json ADDED
@@ -0,0 +1,82 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_class": "FineTuneTrainCogAgentModel",
3
+ "tokenizer_type": "vicuna-7b-v1.5",
4
+ "num_layers": 32,
5
+ "hidden_size": 4096,
6
+ "num_attention_heads": 32,
7
+ "vocab_size": 32000,
8
+ "layernorm_order": "pre",
9
+ "model_parallel_size": 1,
10
+ "max_sequence_length": 4096,
11
+ "is_decoder": [
12
+ true,
13
+ true,
14
+ true,
15
+ true,
16
+ true,
17
+ true,
18
+ true,
19
+ true,
20
+ true,
21
+ true,
22
+ true,
23
+ true,
24
+ true,
25
+ true,
26
+ true,
27
+ true,
28
+ true,
29
+ true,
30
+ true,
31
+ true,
32
+ true,
33
+ true,
34
+ true,
35
+ true,
36
+ true,
37
+ true,
38
+ true,
39
+ true,
40
+ true,
41
+ true,
42
+ true,
43
+ true
44
+ ],
45
+ "cross_attn_hidden_size": 1024,
46
+ "use_bias": false,
47
+ "inner_hidden_size": 11008,
48
+ "cross_hidden_size_per_attention_head": 32,
49
+ "pre_seq_len": 8,
50
+ "lora_rank": 50,
51
+ "use_ptuning": false,
52
+ "use_lora": false,
53
+ "use_qlora": false,
54
+ "layer_range": null,
55
+ "image_length": 256,
56
+ "cross_image_pix": 1120,
57
+ "eva_args": {
58
+ "model_class": "EVA2CLIPModel",
59
+ "num_layers": 63,
60
+ "hidden_size": 1792,
61
+ "num_attention_heads": 16,
62
+ "vocab_size": 1,
63
+ "layernorm_order": "post",
64
+ "model_parallel_size": 1,
65
+ "max_sequence_length": 257,
66
+ "inner_hidden_size": 15360,
67
+ "use_final_layernorm": false,
68
+ "layernorm_epsilon": 1e-06,
69
+ "row_parallel_linear_final_bias": false,
70
+ "image_size": [
71
+ 224,
72
+ 224
73
+ ],
74
+ "pre_len": 1,
75
+ "post_len": 0,
76
+ "in_channels": 3,
77
+ "patch_size": 14
78
+ },
79
+ "bos_token_id": 1,
80
+ "eos_token_id": 2,
81
+ "pad_token_id": 0
82
+ }