RaushanTurganbay HF staff committed on
Commit
6ae32f6
1 Parent(s): aba3cde

Upload LlavaNextVideoForConditionalGeneration

Browse files
README.md CHANGED
@@ -1,8 +1,8 @@
1
  ---
2
- license: llama2
3
- pipeline_tag: image-text-to-text
4
  language:
5
  - en
 
 
6
  ---
7
 
8
  # LLaVA-NeXT-Video Model Card
 
1
  ---
 
 
2
  language:
3
  - en
4
+ license: llama2
5
+ pipeline_tag: image-text-to-text
6
  ---
7
 
8
  # LLaVA-NeXT-Video Model Card
config.json CHANGED
@@ -26,9 +26,10 @@
26
  ]
27
  ],
28
  "image_token_index": 32001,
29
- "model_type": "llava-next-video",
30
  "projector_hidden_act": "gelu",
31
  "spatial_pool_mode": "average",
 
32
  "spatial_pool_stride": 2,
33
  "text_config": {
34
  "_name_or_path": "lmsys/vicuna-7b-v1.5",
 
26
  ]
27
  ],
28
  "image_token_index": 32001,
29
+ "model_type": "llava_next",
30
  "projector_hidden_act": "gelu",
31
  "spatial_pool_mode": "average",
32
+ "spatial_pool_out_channels": 1024,
33
  "spatial_pool_stride": 2,
34
  "text_config": {
35
  "_name_or_path": "lmsys/vicuna-7b-v1.5",
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d5ba83428392aabef9b62c521eb9060aaa81c66c996235a18926b5f37efc437
3
  size 4992938952
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc32753ce8e75e89748b95677d9349d2b47af998457b4ebe22d27dece7338a3d
3
  size 4992938952
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cbd4b8ea0ade12963349edf94d3f420d48b2806811cf48a3fa315034e1576b88
3
  size 4176137496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8022077b98e08236a07b999f1f51ab577bda9c8aa2dc66d12853b1b162731100
3
  size 4176137496