#from transformers import PretrainedConfig from transformers import PretrainedConfig class ApolloConfig(PretrainedConfig): model_type = "apollo" def __init__( self, llm_cfg=None, vision_tower_cfg=None, mm_connector_cfg=None, architectures=None, resume_path=None, image_aspect_ratio=None, num_video_frames=None, mm_vision_select_layer=None, mm_vision_select_feature=None, use_mm_start_end=False, use_mm_patch_token=True, mm_connector_lr=None, vision_resolution=None, interpolate_mode=None, clip_duration=None, vocab_size=None, auto_map=None, **kwargs ): super().__init__(**kwargs) self.architectures = architectures self.llm_cfg = llm_cfg self.vision_tower_cfg = vision_tower_cfg self.mm_connector_cfg = mm_connector_cfg self.resume_path = resume_path self.image_aspect_ratio = image_aspect_ratio self.num_video_frames = num_video_frames self.mm_vision_select_layer = mm_vision_select_layer self.mm_vision_select_feature = mm_vision_select_feature self.use_mm_start_end = use_mm_start_end self.use_mm_patch_token = use_mm_patch_token self.mm_connector_lr = mm_connector_lr self.vision_resolution = vision_resolution self.interpolate_mode = interpolate_mode self.clip_duration = clip_duration self.vocab_size=vocab_size self.auto_map=auto_map