Spaces:
Runtime error
Runtime error
Update app.py - CPU + GPU Inference
Browse files
app.py
CHANGED
@@ -1,59 +1,58 @@
|
|
|
|
1 |
from langchain.llms import CTransformers
|
2 |
from langchain.chains import LLMChain
|
3 |
-
from langchain import PromptTemplate
|
4 |
-
import os
|
5 |
-
import io
|
6 |
import gradio as gr
|
7 |
import time
|
8 |
|
9 |
-
|
10 |
custom_prompt_template = """
|
11 |
-
You are an AI Chatbot named Sunny,
|
12 |
Query: {query}
|
13 |
|
14 |
-
You just return the helpful message in English and always try to provide relevant answers to user's query.
|
15 |
"""
|
16 |
|
|
|
17 |
def set_custom_prompt():
|
18 |
-
prompt = PromptTemplate(
|
19 |
-
|
20 |
return prompt
|
21 |
|
22 |
|
23 |
-
#Loading the model
|
24 |
def load_model():
|
25 |
-
#
|
|
|
|
|
|
|
|
|
26 |
llm = CTransformers(
|
27 |
-
model
|
28 |
model_type="llama",
|
29 |
-
max_new_tokens
|
30 |
-
temperature
|
31 |
-
repetition_penalty
|
32 |
-
|
33 |
-
gpu_layers = 3,
|
34 |
)
|
35 |
|
36 |
return llm
|
37 |
|
38 |
-
print(load_model())
|
39 |
|
40 |
def chain_pipeline():
|
41 |
llm = load_model()
|
42 |
main_prompt = set_custom_prompt()
|
43 |
-
main_chain = LLMChain(
|
44 |
-
prompt=main_prompt,
|
45 |
-
llm=llm
|
46 |
-
)
|
47 |
return main_chain
|
48 |
|
|
|
49 |
llmchain = chain_pipeline()
|
50 |
|
|
|
51 |
def bot(query):
|
52 |
llm_response = llmchain.run({"query": query})
|
53 |
return llm_response
|
54 |
|
|
|
55 |
with gr.Blocks(title='Sunny') as main:
|
56 |
-
# gr.HTML("Code Llama main")
|
57 |
gr.Markdown("# Sunny Chatbot")
|
58 |
chatbot = gr.Chatbot([], elem_id="chatbot", height=700)
|
59 |
msg = gr.Textbox()
|
@@ -65,8 +64,6 @@ with gr.Blocks(title='Sunny') as main:
|
|
65 |
time.sleep(2)
|
66 |
return "", chat_history
|
67 |
|
68 |
-
|
69 |
msg.submit(respond, [msg, chatbot], [msg, chatbot])
|
70 |
|
71 |
-
main.launch(share=
|
72 |
-
|
|
|
1 |
+
import torch
|
2 |
from langchain.llms import CTransformers
|
3 |
from langchain.chains import LLMChain
|
4 |
+
from langchain import PromptTemplate
|
|
|
|
|
5 |
import gradio as gr
|
6 |
import time
|
7 |
|
|
|
8 |
custom_prompt_template = """
|
9 |
+
You are an AI Chatbot named Sunny, created by 'Sic Team', and your task is to provide information to users and chat with them based on given user's query. Below is the user's query.
|
10 |
Query: {query}
|
11 |
|
12 |
+
You just return the helpful message in English and always try to provide relevant answers to the user's query.
|
13 |
"""
|
14 |
|
15 |
+
|
16 |
def set_custom_prompt():
    """Wrap the module-level system prompt in a PromptTemplate.

    Returns:
        PromptTemplate: template exposing the single ``query`` variable.
    """
    return PromptTemplate(
        template=custom_prompt_template,
        input_variables=['query'],
    )
|
20 |
|
21 |
|
|
|
22 |
def load_model():
    """Load the Zephyr-7B GGUF model through the CTransformers wrapper.

    Offloads layers to the GPU when CUDA is available, otherwise runs
    entirely on CPU.

    Returns:
        CTransformers: a ready-to-use LangChain LLM instance.
    """
    # Bug fix: CTransformers does not accept a torch.device via a `device`
    # kwarg (the previous code passed device=torch.device(...) and crashed).
    # GPU usage for GGUF models is controlled by the `gpu_layers` entry of
    # the ctransformers `config` dict, which is also the documented home for
    # the generation parameters below.
    use_gpu = torch.cuda.is_available()
    print(f"Using device: {'cuda' if use_gpu else 'cpu'}")

    llm = CTransformers(
        model="TheBloke/zephyr-7B-beta-GGUF",
        model_type="llama",
        config={
            "max_new_tokens": 1096,
            "temperature": 0.2,
            "repetition_penalty": 1.13,
            # 0 layers = pure CPU; offload up to 50 layers when CUDA exists.
            "gpu_layers": 50 if use_gpu else 0,
        },
    )
    return llm
|
38 |
|
|
|
39 |
|
40 |
def chain_pipeline():
    """Assemble the LLM and prompt template into a runnable LLMChain.

    Returns:
        LLMChain: chain that answers a single ``query`` input.
    """
    model = load_model()
    prompt = set_custom_prompt()
    chain = LLMChain(
        prompt=prompt,
        llm=model,
    )
    return chain
|
45 |
|
46 |
+
|
47 |
# Build the chain once at import time so every request reuses the same model.
llmchain = chain_pipeline()
|
48 |
|
49 |
+
|
50 |
def bot(query):
    """Answer a single user query via the module-level LLM chain.

    Args:
        query: the raw user message.

    Returns:
        The model's reply text.
    """
    return llmchain.run({"query": query})
|
53 |
|
54 |
+
|
55 |
with gr.Blocks(title='Sunny') as main:
|
|
|
56 |
gr.Markdown("# Sunny Chatbot")
|
57 |
chatbot = gr.Chatbot([], elem_id="chatbot", height=700)
|
58 |
msg = gr.Textbox()
|
|
|
64 |
time.sleep(2)
|
65 |
return "", chat_history
|
66 |
|
|
|
67 |
msg.submit(respond, [msg, chatbot], [msg, chatbot])
|
68 |
|
69 |
+
main.launch(share=False)
|
|