Fudan-FUXI committed on
Commit
c3f8d9e
·
verified ·
1 Parent(s): 47d81b8

Upload 4 files

Browse files
Files changed (3) hide show
  1. adapter_config.json +103 -103
  2. adapter_model.safetensors +1 -1
  3. config.json +2 -2
adapter_config.json CHANGED
@@ -20,130 +20,130 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "35.self_attn.k_proj",
24
- "model.layers.4.self_attn.q_proj",
25
- "27.self_attn.k_proj",
26
  "model.layers.25.self_attn.q_proj",
27
- "model.layers.10.self_attn.v_proj",
28
- "38.self_attn.v_proj",
29
- "model.layers.6.self_attn.k_proj",
30
- "model.layers.6.self_attn.v_proj",
31
- "30.self_attn.v_proj",
32
- "model.layers.18.self_attn.k_proj",
33
- "model.layers.13.self_attn.q_proj",
34
- "model.layers.11.self_attn.q_proj",
35
- "37.self_attn.q_proj",
36
- "model.layers.19.self_attn.k_proj",
37
- "model.layers.12.self_attn.k_proj",
38
- "model.layers.26.self_attn.q_proj",
39
- "model.layers.22.self_attn.q_proj",
40
- "model.layers.12.self_attn.q_proj",
41
  "model.layers.11.self_attn.k_proj",
42
- "33.self_attn.v_proj",
43
- "model.layers.13.self_attn.k_proj",
44
- "model.layers.13.self_attn.v_proj",
45
- "model.layers.18.self_attn.v_proj",
46
- "31.self_attn.v_proj",
47
- "29.self_attn.k_proj",
48
- "38.self_attn.q_proj",
49
- "model.layers.25.self_attn.v_proj",
50
  "model.layers.7.self_attn.v_proj",
51
- "model.layers.20.self_attn.q_proj",
52
- "model.layers.1.self_attn.k_proj",
53
- "39.self_attn.k_proj",
54
- "36.self_attn.k_proj",
55
- "model.layers.10.self_attn.q_proj",
56
- "28.self_attn.k_proj",
57
- "27.self_attn.q_proj",
58
- "model.layers.9.self_attn.q_proj",
59
- "28.self_attn.q_proj",
60
- "model.layers.6.self_attn.q_proj",
61
- "34.self_attn.v_proj",
62
- "model.layers.8.self_attn.k_proj",
63
- "model.layers.25.self_attn.k_proj",
64
  "model.layers.16.self_attn.k_proj",
65
- "model.layers.7.self_attn.k_proj",
 
 
 
66
  "31.self_attn.q_proj",
67
- "28.self_attn.v_proj",
68
- "model.layers.14.self_attn.k_proj",
69
- "up_proj",
 
70
  "model.layers.10.self_attn.k_proj",
71
- "model.layers.19.self_attn.v_proj",
72
- "model.layers.19.self_attn.q_proj",
73
- "model.layers.21.self_attn.q_proj",
74
- "model.layers.12.self_attn.v_proj",
75
- "model.layers.23.self_attn.k_proj",
76
  "39.self_attn.v_proj",
 
 
 
 
 
 
 
 
 
 
77
  "model.layers.26.self_attn.v_proj",
78
- "36.self_attn.v_proj",
79
- "32.self_attn.k_proj",
80
- "37.self_attn.k_proj",
81
- "model.layers.0.self_attn.q_proj",
82
  "model.layers.2.self_attn.q_proj",
83
- "o_proj",
84
- "30.self_attn.k_proj",
85
- "29.self_attn.v_proj",
86
- "model.layers.7.self_attn.q_proj",
87
  "down_proj",
88
- "model.layers.17.self_attn.k_proj",
 
 
89
  "model.layers.15.self_attn.v_proj",
90
- "38.self_attn.k_proj",
91
- "35.self_attn.v_proj",
92
- "model.layers.15.self_attn.q_proj",
93
- "model.layers.23.self_attn.q_proj",
94
- "model.layers.21.self_attn.k_proj",
95
- "model.layers.4.self_attn.k_proj",
96
- "model.layers.17.self_attn.v_proj",
97
- "33.self_attn.k_proj",
98
- "model.layers.22.self_attn.k_proj",
99
- "34.self_attn.k_proj",
100
- "model.layers.5.self_attn.k_proj",
101
- "32.self_attn.q_proj",
102
- "model.layers.17.self_attn.q_proj",
103
- "model.layers.22.self_attn.v_proj",
104
- "model.layers.2.self_attn.v_proj",
105
- "model.layers.20.self_attn.v_proj",
106
- "model.layers.23.self_attn.v_proj",
107
- "30.self_attn.q_proj",
108
- "model.layers.1.self_attn.q_proj",
109
- "31.self_attn.k_proj",
110
  "32.self_attn.v_proj",
111
- "model.layers.14.self_attn.q_proj",
 
 
 
 
112
  "model.layers.1.self_attn.v_proj",
113
- "model.layers.14.self_attn.v_proj",
114
- "model.layers.2.self_attn.k_proj",
115
  "model.layers.5.self_attn.q_proj",
116
- "model.layers.5.self_attn.v_proj",
117
- "model.layers.24.self_attn.k_proj",
118
- "27.self_attn.v_proj",
119
- "model.layers.8.self_attn.q_proj",
 
120
  "model.layers.21.self_attn.v_proj",
 
 
 
 
 
 
121
  "37.self_attn.v_proj",
122
- "29.self_attn.q_proj",
123
- "model.layers.11.self_attn.v_proj",
124
- "model.layers.9.self_attn.k_proj",
125
- "model.layers.18.self_attn.q_proj",
126
- "model.layers.0.self_attn.v_proj",
127
- "39.self_attn.q_proj",
128
- "33.self_attn.q_proj",
129
- "model.layers.16.self_attn.q_proj",
130
  "model.layers.0.self_attn.k_proj",
131
- "model.layers.26.self_attn.k_proj",
132
  "36.self_attn.q_proj",
133
- "34.self_attn.q_proj",
134
- "model.layers.9.self_attn.v_proj",
135
- "model.layers.24.self_attn.q_proj",
136
- "model.layers.3.self_attn.q_proj",
137
- "model.layers.20.self_attn.k_proj",
138
- "35.self_attn.q_proj",
139
- "model.layers.3.self_attn.v_proj",
140
- "model.layers.16.self_attn.v_proj",
 
141
  "model.layers.3.self_attn.k_proj",
 
 
 
 
 
 
 
 
142
  "model.layers.15.self_attn.k_proj",
143
- "model.layers.8.self_attn.v_proj",
144
- "gate_proj",
145
  "model.layers.24.self_attn.v_proj",
146
- "model.layers.4.self_attn.v_proj"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
147
  ],
148
  "task_type": "CAUSAL_LM",
149
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "model.layers.0.self_attn.v_proj",
 
 
24
  "model.layers.25.self_attn.q_proj",
25
+ "model.layers.14.self_attn.q_proj",
26
+ "model.layers.24.self_attn.k_proj",
27
+ "o_proj",
28
+ "model.layers.15.self_attn.q_proj",
 
 
 
 
 
 
 
 
 
 
29
  "model.layers.11.self_attn.k_proj",
 
 
 
 
 
 
 
 
30
  "model.layers.7.self_attn.v_proj",
31
+ "29.self_attn.q_proj",
32
+ "model.layers.19.self_attn.k_proj",
33
+ "34.self_attn.q_proj",
34
+ "model.layers.14.self_attn.v_proj",
 
 
 
 
 
 
 
 
 
35
  "model.layers.16.self_attn.k_proj",
36
+ "model.layers.22.self_attn.v_proj",
37
+ "model.layers.25.self_attn.v_proj",
38
+ "34.self_attn.v_proj",
39
+ "model.layers.19.self_attn.v_proj",
40
  "31.self_attn.q_proj",
41
+ "39.self_attn.q_proj",
42
+ "29.self_attn.k_proj",
43
+ "model.layers.11.self_attn.v_proj",
44
+ "model.layers.22.self_attn.k_proj",
45
  "model.layers.10.self_attn.k_proj",
46
+ "model.layers.26.self_attn.k_proj",
 
 
 
 
47
  "39.self_attn.v_proj",
48
+ "model.layers.4.self_attn.q_proj",
49
+ "model.layers.8.self_attn.k_proj",
50
+ "model.layers.6.self_attn.q_proj",
51
+ "model.layers.11.self_attn.q_proj",
52
+ "38.self_attn.q_proj",
53
+ "model.layers.16.self_attn.q_proj",
54
+ "model.layers.19.self_attn.q_proj",
55
+ "model.layers.12.self_attn.k_proj",
56
+ "33.self_attn.q_proj",
57
+ "model.layers.13.self_attn.q_proj",
58
  "model.layers.26.self_attn.v_proj",
59
+ "31.self_attn.v_proj",
60
+ "model.layers.17.self_attn.v_proj",
61
+ "38.self_attn.k_proj",
62
+ "model.layers.25.self_attn.k_proj",
63
  "model.layers.2.self_attn.q_proj",
 
 
 
 
64
  "down_proj",
65
+ "27.self_attn.v_proj",
66
+ "model.layers.2.self_attn.k_proj",
67
+ "model.layers.24.self_attn.q_proj",
68
  "model.layers.15.self_attn.v_proj",
69
+ "35.self_attn.q_proj",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
70
  "32.self_attn.v_proj",
71
+ "31.self_attn.k_proj",
72
+ "model.layers.17.self_attn.k_proj",
73
+ "model.layers.12.self_attn.q_proj",
74
+ "model.layers.16.self_attn.v_proj",
75
+ "gate_proj",
76
  "model.layers.1.self_attn.v_proj",
77
+ "model.layers.18.self_attn.q_proj",
 
78
  "model.layers.5.self_attn.q_proj",
79
+ "model.layers.20.self_attn.v_proj",
80
+ "model.layers.3.self_attn.q_proj",
81
+ "model.layers.21.self_attn.q_proj",
82
+ "35.self_attn.v_proj",
83
+ "model.layers.23.self_attn.v_proj",
84
  "model.layers.21.self_attn.v_proj",
85
+ "model.layers.20.self_attn.q_proj",
86
+ "model.layers.13.self_attn.k_proj",
87
+ "27.self_attn.q_proj",
88
+ "model.layers.2.self_attn.v_proj",
89
+ "model.layers.14.self_attn.k_proj",
90
+ "model.layers.7.self_attn.q_proj",
91
  "37.self_attn.v_proj",
92
+ "model.layers.3.self_attn.v_proj",
93
+ "33.self_attn.k_proj",
94
+ "36.self_attn.v_proj",
 
 
 
 
 
95
  "model.layers.0.self_attn.k_proj",
96
+ "37.self_attn.q_proj",
97
  "36.self_attn.q_proj",
98
+ "30.self_attn.v_proj",
99
+ "30.self_attn.k_proj",
100
+ "34.self_attn.k_proj",
101
+ "model.layers.7.self_attn.k_proj",
102
+ "37.self_attn.k_proj",
103
+ "28.self_attn.v_proj",
104
+ "32.self_attn.q_proj",
105
+ "30.self_attn.q_proj",
106
+ "model.layers.18.self_attn.v_proj",
107
  "model.layers.3.self_attn.k_proj",
108
+ "27.self_attn.k_proj",
109
+ "model.layers.8.self_attn.q_proj",
110
+ "model.layers.9.self_attn.k_proj",
111
+ "32.self_attn.k_proj",
112
+ "model.layers.18.self_attn.k_proj",
113
+ "model.layers.6.self_attn.v_proj",
114
+ "model.layers.10.self_attn.q_proj",
115
+ "28.self_attn.k_proj",
116
  "model.layers.15.self_attn.k_proj",
117
+ "33.self_attn.v_proj",
118
+ "model.layers.1.self_attn.q_proj",
119
  "model.layers.24.self_attn.v_proj",
120
+ "model.layers.4.self_attn.k_proj",
121
+ "model.layers.23.self_attn.q_proj",
122
+ "model.layers.9.self_attn.q_proj",
123
+ "model.layers.13.self_attn.v_proj",
124
+ "model.layers.23.self_attn.k_proj",
125
+ "model.layers.20.self_attn.k_proj",
126
+ "model.layers.17.self_attn.q_proj",
127
+ "model.layers.22.self_attn.q_proj",
128
+ "model.layers.21.self_attn.k_proj",
129
+ "35.self_attn.k_proj",
130
+ "model.layers.5.self_attn.k_proj",
131
+ "model.layers.6.self_attn.k_proj",
132
+ "model.layers.12.self_attn.v_proj",
133
+ "36.self_attn.k_proj",
134
+ "28.self_attn.q_proj",
135
+ "model.layers.1.self_attn.k_proj",
136
+ "model.layers.8.self_attn.v_proj",
137
+ "model.layers.5.self_attn.v_proj",
138
+ "model.layers.26.self_attn.q_proj",
139
+ "29.self_attn.v_proj",
140
+ "model.layers.4.self_attn.v_proj",
141
+ "up_proj",
142
+ "model.layers.0.self_attn.q_proj",
143
+ "39.self_attn.k_proj",
144
+ "38.self_attn.v_proj",
145
+ "model.layers.10.self_attn.v_proj",
146
+ "model.layers.9.self_attn.v_proj"
147
  ],
148
  "task_type": "CAUSAL_LM",
149
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c751b388d0af63dc7e757fc16bfb817a26fd4a33ef522f2b668f381a85173df
3
  size 1001469184
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fccb793e8a9c714b86ec6ef72647ec0799926358ef5c7519f8ac96a02a46ac1
3
  size 1001469184
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "./checkpoints/24-1107-vila-v1.5-13b-lora-r128-alpha256-lr-1e5-hdvila1000+human_feedback_multi_level-25epoch-release",
3
  "architectures": [
4
  "LlavaLlamaModel"
5
  ],
@@ -167,7 +167,7 @@
167
  "model_dtype": "torch.bfloat16",
168
  "model_type": "llava_llama",
169
  "num_video_frames": 8,
170
- "resume_path": "./checkpoints/24-1107-vila-v1.5-13b-lora-r128-alpha256-lr-1e5-hdvila1000+human_feedback_multi_level-25epoch-release",
171
  "s2": false,
172
  "s2_max_split_size": 336,
173
  "s2_scales": "336,672,1008",
 
1
  {
2
+ "_name_or_path": "./checkpoints/LiFT-Critic-13b",
3
  "architectures": [
4
  "LlavaLlamaModel"
5
  ],
 
167
  "model_dtype": "torch.bfloat16",
168
  "model_type": "llava_llama",
169
  "num_video_frames": 8,
170
+ "resume_path": "./checkpoints/LiFT-Critic-13b",
171
  "s2": false,
172
  "s2_max_split_size": 336,
173
  "s2_scales": "336,672,1008",