File size: 1,349 Bytes
779abe8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
# This source code is licensed under the license found in the
# LICENSE file in the root directory of this source tree.

from transformers import PretrainedConfig


class InfiMMConfig(PretrainedConfig):
    """Configuration object for InfiMM models.

    Stores the constructor arguments as attributes on the instance and
    delegates all remaining keyword arguments to ``PretrainedConfig``.

    Args:
        model_type: Variant identifier stored on the instance. Note that this
            shadows the class-level ``model_type`` (``"infimm"``) for
            attribute reads on the instance.
        seq_length: Stored as ``self.seq_length``; presumably the maximum
            sequence length -- confirm against the model code.
        tokenizer_type: Name of the tokenizer class, stored as-is.
        torch_dtype: Dtype (name) forwarded to ``PretrainedConfig``, which
            owns this attribute.
        transformers_version: Version string forwarded to
            ``PretrainedConfig``, which owns this attribute.
        use_cache: Stored as ``self.use_cache``.
        use_flash_attn: Stored as ``self.use_flash_attn``.
        cross_attn_every_n_layers: Stored as
            ``self.cross_attn_every_n_layers``.
        use_grad_checkpoint: Stored as ``self.use_grad_checkpoint``.
        freeze_llm: Stored as ``self.freeze_llm``.
        visual: Stored as-is; presumably the vision-side sub-configuration
            -- confirm against the model code.
        language: Stored as-is; presumably the language-model
            sub-configuration -- confirm against the model code.
        image_token_id: Stored as ``self.image_token_id``.
        eoc_token_id: Stored as ``self.eoc_token_id``.
        **kwargs: Passed through unchanged to ``PretrainedConfig.__init__``.
    """

    model_type = "infimm"

    def __init__(
        self,
        model_type="infimm-zephyr",
        seq_length=1024,
        tokenizer_type="ZephyrTokenizer",
        torch_dtype="bfloat16",
        transformers_version="4.35.2",
        use_cache=True,
        use_flash_attn=False,
        cross_attn_every_n_layers=2,
        use_grad_checkpoint=False,
        freeze_llm=True,
        visual=None,
        language=None,
        image_token_id=None,
        eoc_token_id=None,
        **kwargs,
    ):
        # Instance attribute intentionally kept: it shadows the class-level
        # ``model_type`` so existing readers of ``config.model_type`` see the
        # variant name passed in here.
        self.model_type = model_type
        self.seq_length = seq_length
        self.tokenizer_type = tokenizer_type
        self.use_cache = use_cache
        self.use_flash_attn = use_flash_attn
        self.cross_attn_every_n_layers = cross_attn_every_n_layers
        self.use_grad_checkpoint = use_grad_checkpoint
        self.freeze_llm = freeze_llm
        self.visual = visual
        self.language = language
        self.image_token_id = image_token_id
        self.eoc_token_id = eoc_token_id

        # ``torch_dtype`` and ``transformers_version`` are attributes that
        # ``PretrainedConfig.__init__`` assigns itself from its keyword
        # arguments. Because they are named parameters here they never reach
        # ``kwargs``; assigning them before the call would let the base
        # initializer overwrite them with its own defaults. Forward them
        # explicitly so the values supplied by the caller (or loaded from
        # ``config.json``) are the ones that stick.
        super().__init__(
            torch_dtype=torch_dtype,
            transformers_version=transformers_version,
            **kwargs,
        )