danielhanchen committed on
Commit
44fde8c
1 Parent(s): f03063c

Upload MllamaForConditionalGeneration

Browse files
config.json CHANGED
@@ -19,44 +19,18 @@
19
  "multi_modal_projector",
20
  "merger",
21
  "modality_projection",
22
- "vision_model.transformer.layers.0.mlp",
23
- "vision_model.transformer.layers.1.mlp",
24
- "vision_model.transformer.layers.2.mlp",
25
- "vision_model.transformer.layers.3.mlp",
26
- "vision_model.transformer.layers.4.mlp",
27
- "vision_model.transformer.layers.5.mlp",
28
- "vision_model.transformer.layers.6.mlp",
29
- "vision_model.transformer.layers.7.mlp",
30
- "vision_model.transformer.layers.8.mlp",
31
- "vision_model.transformer.layers.9.mlp",
32
- "vision_model.transformer.layers.10.mlp",
33
- "vision_model.transformer.layers.11.mlp",
34
- "vision_model.transformer.layers.12.mlp",
35
- "vision_model.transformer.layers.13.mlp",
36
- "vision_model.transformer.layers.14.mlp",
37
- "vision_model.transformer.layers.15.mlp",
38
- "vision_model.transformer.layers.16.mlp",
39
- "vision_model.transformer.layers.17.mlp",
40
- "vision_model.transformer.layers.18.mlp",
41
- "vision_model.transformer.layers.19.mlp",
42
- "vision_model.transformer.layers.20.mlp",
43
- "vision_model.transformer.layers.21.mlp",
44
- "vision_model.transformer.layers.22.mlp",
45
- "vision_model.transformer.layers.23.mlp",
46
- "vision_model.transformer.layers.24.mlp",
47
- "vision_model.transformer.layers.25.mlp",
48
- "vision_model.transformer.layers.26.mlp",
49
- "vision_model.transformer.layers.27.mlp",
50
- "vision_model.transformer.layers.28.mlp",
51
- "vision_model.transformer.layers.29.mlp",
52
- "vision_model.transformer.layers.30.mlp",
53
- "vision_model.transformer.layers.31.mlp",
54
- "vision_model.global_transformer.layers.0.mlp",
55
- "vision_model.global_transformer.layers.1.mlp",
56
- "vision_model.global_transformer.layers.2.mlp",
57
- "vision_model.global_transformer.layers.3.mlp",
58
- "vision_model.global_transformer.layers.4.mlp",
59
- "vision_model.global_transformer.layers.5.mlp"
60
  ],
61
  "llm_int8_threshold": 6.0,
62
  "load_in_4bit": true,
 
19
  "multi_modal_projector",
20
  "merger",
21
  "modality_projection",
22
+ "language_model.model.layers.1.self_attn",
23
+ "language_model.model.layers.1.mlp",
24
+ "vision_model.transformer.layers.13.mlp.fc2",
25
+ "language_model.model.layers.8.cross_attn.o_proj",
26
+ "language_model.model.layers.13.cross_attn.o_proj",
27
+ "language_model.model.layers.13.mlp.down_proj",
28
+ "language_model.model.layers.18.cross_attn.o_proj",
29
+ "language_model.model.layers.18.mlp.down_proj",
30
+ "language_model.model.layers.23.cross_attn.o_proj",
31
+ "language_model.model.layers.28.cross_attn.o_proj",
32
+ "language_model.model.layers.33.cross_attn.o_proj",
33
+ "language_model.model.layers.38.cross_attn.o_proj"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
34
  ],
35
  "llm_int8_threshold": 6.0,
36
  "load_in_4bit": true,
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df871653461fc0de46e87c4ee385e4aa992867ca244439ca7ba52798299e64e5
3
- size 4990770382
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afad208b9b805474e7f5d8de82043cf970f6e799c0b655cd6c6e522b9371e618
3
+ size 4971535505
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd435129de51a39511eef736db475e561c794a0011910e1f96cf5c5ebd844f8d
3
- size 2974910239
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc63401a455ef422970874eabac70ebf6380eb565c592341c4932092f569f720
3
+ size 2937067316
model.safetensors.index.json CHANGED
The diff for this file is too large to render. See raw diff