danielhanchen
committed on
Commit
•
44fde8c
1
Parent(s):
f03063c
Upload MllamaForConditionalGeneration
Browse files
- config.json +12 -38
- model-00001-of-00002.safetensors +2 -2
- model-00002-of-00002.safetensors +2 -2
- model.safetensors.index.json +0 -0
config.json
CHANGED
@@ -19,44 +19,18 @@
|
|
19 |
"multi_modal_projector",
|
20 |
"merger",
|
21 |
"modality_projection",
|
22 |
-
"
|
23 |
-
"
|
24 |
-
"vision_model.transformer.layers.
|
25 |
-
"
|
26 |
-
"
|
27 |
-
"
|
28 |
-
"
|
29 |
-
"
|
30 |
-
"
|
31 |
-
"
|
32 |
-
"
|
33 |
-
"
|
34 |
-
"vision_model.transformer.layers.12.mlp",
|
35 |
-
"vision_model.transformer.layers.13.mlp",
|
36 |
-
"vision_model.transformer.layers.14.mlp",
|
37 |
-
"vision_model.transformer.layers.15.mlp",
|
38 |
-
"vision_model.transformer.layers.16.mlp",
|
39 |
-
"vision_model.transformer.layers.17.mlp",
|
40 |
-
"vision_model.transformer.layers.18.mlp",
|
41 |
-
"vision_model.transformer.layers.19.mlp",
|
42 |
-
"vision_model.transformer.layers.20.mlp",
|
43 |
-
"vision_model.transformer.layers.21.mlp",
|
44 |
-
"vision_model.transformer.layers.22.mlp",
|
45 |
-
"vision_model.transformer.layers.23.mlp",
|
46 |
-
"vision_model.transformer.layers.24.mlp",
|
47 |
-
"vision_model.transformer.layers.25.mlp",
|
48 |
-
"vision_model.transformer.layers.26.mlp",
|
49 |
-
"vision_model.transformer.layers.27.mlp",
|
50 |
-
"vision_model.transformer.layers.28.mlp",
|
51 |
-
"vision_model.transformer.layers.29.mlp",
|
52 |
-
"vision_model.transformer.layers.30.mlp",
|
53 |
-
"vision_model.transformer.layers.31.mlp",
|
54 |
-
"vision_model.global_transformer.layers.0.mlp",
|
55 |
-
"vision_model.global_transformer.layers.1.mlp",
|
56 |
-
"vision_model.global_transformer.layers.2.mlp",
|
57 |
-
"vision_model.global_transformer.layers.3.mlp",
|
58 |
-
"vision_model.global_transformer.layers.4.mlp",
|
59 |
-
"vision_model.global_transformer.layers.5.mlp"
|
60 |
],
|
61 |
"llm_int8_threshold": 6.0,
|
62 |
"load_in_4bit": true,
|
|
|
19 |
"multi_modal_projector",
|
20 |
"merger",
|
21 |
"modality_projection",
|
22 |
+
"language_model.model.layers.1.self_attn",
|
23 |
+
"language_model.model.layers.1.mlp",
|
24 |
+
"vision_model.transformer.layers.13.mlp.fc2",
|
25 |
+
"language_model.model.layers.8.cross_attn.o_proj",
|
26 |
+
"language_model.model.layers.13.cross_attn.o_proj",
|
27 |
+
"language_model.model.layers.13.mlp.down_proj",
|
28 |
+
"language_model.model.layers.18.cross_attn.o_proj",
|
29 |
+
"language_model.model.layers.18.mlp.down_proj",
|
30 |
+
"language_model.model.layers.23.cross_attn.o_proj",
|
31 |
+
"language_model.model.layers.28.cross_attn.o_proj",
|
32 |
+
"language_model.model.layers.33.cross_attn.o_proj",
|
33 |
+
"language_model.model.layers.38.cross_attn.o_proj"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
34 |
],
|
35 |
"llm_int8_threshold": 6.0,
|
36 |
"load_in_4bit": true,
|
model-00001-of-00002.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afad208b9b805474e7f5d8de82043cf970f6e799c0b655cd6c6e522b9371e618
|
3 |
+
size 4971535505
|
model-00002-of-00002.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc63401a455ef422970874eabac70ebf6380eb565c592341c4932092f569f720
|
3 |
+
size 2937067316
|
model.safetensors.index.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|