MOHAMMED-N committed on
Commit f61ef97 · verified · 1 Parent(s): dadd14f

Update app.py

Files changed (1)
  1. app.py +5 -5
app.py CHANGED
@@ -59,12 +59,12 @@ def build_vectorstore():
 # --- 3) تحميل النموذج ---
 def load_llm():
     """
-    Downloads the Q4_K_M GGUF model from mobeidat's Hugging Face repository and loads it via llama-cpp.
+    Downloads a Q4_K_M GGUF model and loads it via llama-cpp.
     """
     # 1) Download the GGUF model from Hugging Face
     model_file = hf_hub_download(
-        repo_id="mobeidat/c4ai-command-r7b-arabic-02-2025-Q4_K_M-GGUF",
-        filename="c4ai-command-r7b-arabic-02-2025-q4_k_m.gguf",
+        repo_id="DevQuasar/CohereForAI.c4ai-command-r7b-arabic-02-2025-GGUF",
+        filename="CohereForAI.c4ai-command-r7b-arabic-02-2025-Q4_K_M.gguf",
         local_dir="./models",
         local_dir_use_symlinks=False
     )
@@ -73,8 +73,8 @@ def load_llm():
     llm = LlamaCpp(
         model_path=model_file,
         flash_attn=False,
-        n_ctx=2048, # or 4096 depending on your needs
-        n_batch=512, # or even 256 depending on your hardware
+        n_ctx=2048, # or 4096
+        n_batch=512, # or even 256
         chat_format='chatml'
     )
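For context, below is a minimal, self-contained sketch of load_llm() as it reads after this commit. The diff only shows the function body, so the imports and the smoke test at the bottom are assumptions: it assumes LlamaCpp is the langchain_community wrapper around llama-cpp-python (which forwards extra keyword arguments such as flash_attn and chat_format to llama_cpp.Llama); if the app aliases llama_cpp.Llama directly, adjust the import accordingly.

from huggingface_hub import hf_hub_download
# Assumed import -- the commit does not show where LlamaCpp comes from.
from langchain_community.llms import LlamaCpp


def load_llm():
    """
    Downloads a Q4_K_M GGUF model and loads it via llama-cpp.
    """
    # 1) Download the GGUF model from Hugging Face into ./models
    model_file = hf_hub_download(
        repo_id="DevQuasar/CohereForAI.c4ai-command-r7b-arabic-02-2025-GGUF",
        filename="CohereForAI.c4ai-command-r7b-arabic-02-2025-Q4_K_M.gguf",
        local_dir="./models",
        local_dir_use_symlinks=False,
    )

    # 2) Load the local GGUF file with llama-cpp
    llm = LlamaCpp(
        model_path=model_file,
        flash_attn=False,
        n_ctx=2048,   # or 4096
        n_batch=512,  # or even 256
        chat_format='chatml',
    )
    return llm


if __name__ == "__main__":
    # Hypothetical smoke test, not part of the commit: load the model and
    # send a short Arabic greeting ("hello") through the LangChain interface.
    llm = load_llm()
    print(llm.invoke("مرحبا"))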