Spaces:

MrOvkill
/

MiniChat-3B

Sleeping

Samuel L Meyers committed on Nov 17, 2023

Commit

c17b3f7

•

1 Parent(s): ecd2bcd

Use llama-cpp-python

Files changed (3) hide show

__pycache__/conversation.cpython-311.pyc ADDED Viewed

Binary file (9.27 kB). View file

app.py CHANGED Viewed

@@ -6,7 +6,7 @@ import torch
 from conversation import get_default_conv_template
 import gradio as gr
-from pyllamacpp.model import Model
 import wget
 """
@@ -31,11 +31,11 @@ model_path = "minichat-3b.q8_0.gguf"
 mdlpath = hf_hub_download(repo_id="afrideva/MiniChat-3B-GGUF", filename=model_path)
-lcpp_model = Model(model_path=mdlpath)
 def m3b_talk(text):
     resp = ""
-    for token in lcpp_model.generate(text):
         resp += token
     return resp

 from conversation import get_default_conv_template
 import gradio as gr
+from llama_cpp import Llama
 import wget
 """
 mdlpath = hf_hub_download(repo_id="afrideva/MiniChat-3B-GGUF", filename=model_path)
+lcpp_model = Llama(model_path=mdlpath)
 def m3b_talk(text):
     resp = ""
+    for token in lcpp_model("<s> [|User|]" + text + "</s> [|Assistant|]", stop=["[|User|]", "\n"], echo=True):
         resp += token
     return resp

requirements.txt CHANGED Viewed

@@ -8,5 +8,5 @@ git+https://github.com/huggingface/transformers
 torch
 sentencepiece
 accelerate
-pyllamacpp
 wget

 torch
 sentencepiece
 accelerate
+llama-cpp-python>=0.2.18
 wget