Spaces:
Sleeping
Add KnownModels
Browse files
app.py
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
import gradio as gr
|
2 |
-
from llm_rs import AutoModel,SessionConfig,GenerationConfig,Precision
|
3 |
|
4 |
# https://huggingface.co/TheBloke/open-llama-13b-open-instruct-GGML/blob/main/open-llama-13b-open-instruct.ggmlv3.q8_0.bin
|
5 |
repo_name = "TheBloke/open-llama-13b-open-instruct-GGML"
|
@@ -15,7 +15,7 @@ examples = [
|
|
15 |
]
|
16 |
|
17 |
session_config = SessionConfig(threads=2,batch_size=2)
|
18 |
-
model = AutoModel.from_pretrained(repo_name, model_file=file_name, session_config=session_config,verbose=True)
|
19 |
|
20 |
def process_stream(instruction, temperature, top_p, top_k, max_new_tokens, seed):
|
21 |
|
|
|
1 |
import gradio as gr
|
2 |
+
from llm_rs import AutoModel, SessionConfig, GenerationConfig, Precision, KnownModels
|
3 |
|
4 |
# https://huggingface.co/TheBloke/open-llama-13b-open-instruct-GGML/blob/main/open-llama-13b-open-instruct.ggmlv3.q8_0.bin
|
5 |
repo_name = "TheBloke/open-llama-13b-open-instruct-GGML"
|
|
|
15 |
]
|
16 |
|
17 |
session_config = SessionConfig(threads=2,batch_size=2)
|
18 |
+
model = AutoModel.from_pretrained(repo_name, model_file=file_name, model_type=KnownModels.Llama, session_config=session_config,verbose=True)
|
19 |
|
20 |
def process_stream(instruction, temperature, top_p, top_k, max_new_tokens, seed):
|
21 |
|