Spaces:

gufett0
/

chatbot-llamaindex

Sleeping

gufett0 committed on Sep 13, 2024

Commit

0865501

1 Parent(s): 8c678cf

removed huggingface_hub

Files changed (1) hide show

backend.py CHANGED Viewed

@@ -13,10 +13,10 @@ from llama_cpp import Llama
 import spaces
-huggingface_token = os.getenv("HUGGINGFACE_TOKEN")
-hf_hub_download(
     repo_id="google/gemma-2-2b-it-GGUF",
     filename="2b_it_v2.gguf",
     local_dir="./models",
@@ -29,20 +29,20 @@ llm = Llama(
             _gpu_layers=81,
             n_batch=1024,
             n_ctx=8192,
-        )
-"""model_id = "google/gemma-2-2b-it"
 tokenizer = GemmaTokenizerFast.from_pretrained(model_id)
 model = AutoModelForCausalLM.from_pretrained(
     model_id,
     device_map="auto",
     torch_dtype= torch.float16 if torch.cuda.is_available() else torch.float32,
-)"""
 # what models will be used by LlamaIndex:
 Settings.embed_model = InstructorEmbedding(model_name="hkunlp/instructor-base")
-#Settings.llm  = GemmaLLMInterface(model=model, tokenizer=tokenizer)
-Settings.llm  = llm
 ############################---------------------------------

 import spaces
+#huggingface_token = os.getenv("HUGGINGFACE_TOKEN")
+"""hf_hub_download(
     repo_id="google/gemma-2-2b-it-GGUF",
     filename="2b_it_v2.gguf",
     local_dir="./models",
             _gpu_layers=81,
             n_batch=1024,
             n_ctx=8192,
+        )"""
+model_id = "google/gemma-2-2b-it"
 tokenizer = GemmaTokenizerFast.from_pretrained(model_id)
 model = AutoModelForCausalLM.from_pretrained(
     model_id,
     device_map="auto",
     torch_dtype= torch.float16 if torch.cuda.is_available() else torch.float32,
+)
 # what models will be used by LlamaIndex:
 Settings.embed_model = InstructorEmbedding(model_name="hkunlp/instructor-base")
+Settings.llm  = GemmaLLMInterface(model=model, tokenizer=tokenizer)
+#Settings.llm  = llm
 ############################---------------------------------