Update modeling_llama.py
modeling_llama.py: +3 -1

--- a/modeling_llama.py
+++ b/modeling_llama.py
@@ -1,7 +1,7 @@
 from typing import Optional, List, Union, Tuple
 
 import torch
-from transformers import LlamaModel, Cache, DynamicCache
+from transformers import LlamaConfig, LlamaModel, Cache, DynamicCache
 from transformers.modeling_attn_mask_utils import _prepare_4d_causal_attention_mask_for_sdpa, \
     _prepare_4d_causal_attention_mask
 from transformers.modeling_outputs import BaseModelOutputWithPast
@@ -144,6 +144,8 @@ class MightyLlamaModel(LlamaModel):
 
 
 class MightyLlamaForCausalLM(LlamaForCausalLM):
+    config_class = LlamaConfig
+
     def __init__(self, config):
         super().__init__(config)
         self.model = MightyLlamaModel(config)
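Setting config_class on a PreTrainedModel subclass tells the transformers save/load machinery which configuration class to serialize with save_pretrained and to rebuild during from_pretrained. A minimal usage sketch follows, assuming modeling_llama.py is importable from the working directory; the tiny config values and the save path are illustrative only, not part of the commit.

# Minimal sketch (not part of the commit). Assumes modeling_llama.py is
# importable; config values and save path are illustrative.
from transformers import LlamaConfig

from modeling_llama import MightyLlamaForCausalLM  # assumed import path

# Build a small config and instantiate the custom model with it.
config = LlamaConfig(
    vocab_size=1000,
    hidden_size=256,
    intermediate_size=512,
    num_hidden_layers=2,
    num_attention_heads=4,
)
model = MightyLlamaForCausalLM(config)

# save_pretrained writes the config alongside the weights; from_pretrained
# then reconstructs it through the declared config_class.
model.save_pretrained("./mighty-llama-tiny")
reloaded = MightyLlamaForCausalLM.from_pretrained("./mighty-llama-tiny")

Declaring config_class directly on the subclass also makes the pairing between MightyLlamaForCausalLM and LlamaConfig explicit at the class definition, rather than relying on what is inherited from the parent class.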