Update minigpt4/models/mini_gpt4.py
Browse files
minigpt4/models/mini_gpt4.py
CHANGED
@@ -87,16 +87,16 @@ class MiniGPT4(Blip2Base):
|
|
87 |
print('Loading Q-Former Done')
|
88 |
|
89 |
print('Loading LLAMA')
|
90 |
-
self.llama_tokenizer = LlamaTokenizer.from_pretrained('
|
91 |
self.llama_tokenizer.pad_token = self.llama_tokenizer.eos_token
|
92 |
|
93 |
if llama_cache_dir:
|
94 |
self.llama_model = LlamaForCausalLM.from_pretrained(
|
95 |
-
'
|
96 |
)
|
97 |
else:
|
98 |
self.llama_model = LlamaForCausalLM.from_pretrained(
|
99 |
-
'
|
100 |
)
|
101 |
for name, param in self.llama_model.named_parameters():
|
102 |
param.requires_grad = False
|
|
|
87 |
print('Loading Q-Former Done')
|
88 |
|
89 |
print('Loading LLAMA')
|
90 |
+
self.llama_tokenizer = LlamaTokenizer.from_pretrained('Selali/minigpt4', use_fast=False, use_auth_token=os.environ["API_TOKEN"])
|
91 |
self.llama_tokenizer.pad_token = self.llama_tokenizer.eos_token
|
92 |
|
93 |
if llama_cache_dir:
|
94 |
self.llama_model = LlamaForCausalLM.from_pretrained(
|
95 |
+
'Selali/minigpt4', load_in_8bit=True, torch_dtype=torch.float16, device_map="auto", use_auth_token=os.environ["API_TOKEN"]
|
96 |
)
|
97 |
else:
|
98 |
self.llama_model = LlamaForCausalLM.from_pretrained(
|
99 |
+
'Selali/minigpt4', load_in_8bit=True, torch_dtype=torch.float16, device_map="auto", use_auth_token=os.environ["API_TOKEN"]
|
100 |
)
|
101 |
for name, param in self.llama_model.named_parameters():
|
102 |
param.requires_grad = False
|