zwt123home123 committed
Commit 1506a1b
Parent(s): 2c3c568
Update modeling_internlm2.py
modeling_internlm2.py CHANGED (+3 -3)
@@ -311,9 +311,9 @@ class InternLM2Attention(nn.Module):
         self.attncut = True
         self.headcut = True
         self.layercut = True
-        self.layercut_idx = 36
-        self.offset = 41
-        head_num=24
+        self.layercut_idx = 36  # number of layers kept
+        self.offset = 41  # system prompt token length
+        head_num = 24  # number of heads kept on average
         self.mask = torch.load("headcut_mask/internvl2.0_26B/mask_"+str(head_num)+".pth")
     def _init_rope(self):
         if self.config.rope_scaling is None:
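For context, below is a minimal sketch of how a per-head 0/1 mask like the one loaded here might be consumed downstream; the attention code itself is not part of this diff. The function apply_headcut, the mask layout (one 0/1 entry per head), and the gating semantics are assumptions made for illustration; only the torch.load path, head_num = 24, and the offset value come from the commit.

# Sketch only, assuming a per-head 0/1 mask; not the actual modeling_internlm2.py code.
import torch

def apply_headcut(attn_output: torch.Tensor, head_mask: torch.Tensor, offset: int) -> torch.Tensor:
    """Zero out cut heads, but leave the first `offset` (system prompt) tokens intact.

    attn_output: (batch, num_heads, seq_len, head_dim)
    head_mask:   (num_heads,) with 1 = keep head, 0 = cut head
    """
    prefix = attn_output[:, :, :offset, :]                          # protected prefix tokens
    rest = attn_output[:, :, offset:, :] * head_mask.view(1, -1, 1, 1)  # gate the remaining tokens per head
    return torch.cat([prefix, rest], dim=2)

# Loading mirrors the committed line (requires the mask file on disk):
# self.mask = torch.load("headcut_mask/internvl2.0_26B/mask_" + str(head_num) + ".pth")
out = torch.randn(1, 48, 100, 64)               # hypothetical shapes for demonstration
head_mask = (torch.rand(48) < 0.5).float()      # stand-in for one layer's 0/1 mask
print(apply_headcut(out, head_mask, offset=41).shape)  # torch.Size([1, 48, 100, 64])

The offset guard reflects the new comment that the first 41 tokens are the system prompt, which the commit presumably wants left untouched by head cutting.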