ans123 committed on
Commit
aa5530b
·
verified ·
1 Parent(s): f205342

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -14
app.py CHANGED
@@ -1,15 +1,14 @@
1
  import gradio as gr
2
  import pandas as pd
3
  import torch
4
- import transformers
5
 
6
- # Load the model pipeline
7
- model_id = "meta-llama/Meta-Llama-3.1-8B-Instruct"
8
- pipeline = transformers.pipeline(
9
  "text-generation",
10
- model=model_id,
11
- model_kwargs={"torch_dtype": torch.bfloat16},
12
- device_map="auto",
13
  )
14
 
15
  # Define the initial system message
@@ -55,17 +54,15 @@ def chat(user_input, messages):
55
  messages.append({"role": "user", "content": user_input})
56
 
57
  # Prepare the input for the model
58
- input_text = messages.copy() # Make a copy of messages
59
 
60
  # Generate a response using the pipeline
61
  try:
62
- # Convert the messages to a format the model can understand
63
- formatted_input = "\n".join([f"{msg['role']}: {msg['content']}" for msg in input_text])
64
- response = pipeline(formatted_input, max_new_tokens=256)
65
 
66
  # Extract the assistant's response
67
- response_content = response[0]["generated_text"].strip()
68
-
69
  # Store assistant response in the chat history
70
  messages.append({"role": "assistant", "content": response_content})
71
 
@@ -77,7 +74,7 @@ def chat(user_input, messages):
77
 
78
  # Gradio Interface
79
  with gr.Blocks() as demo:
80
- gr.Markdown("## Fashion Assistant Chatbot")
81
 
82
  # Sidebar for user inputs
83
  with gr.Row():
 
1
  import gradio as gr
2
  import pandas as pd
3
  import torch
4
+ from transformers import pipeline
5
 
6
+ # Load the Zephyr-7B-Beta model pipeline
7
+ pipe = pipeline(
 
8
  "text-generation",
9
+ model="HuggingFaceH4/zephyr-7b-beta",
10
+ torch_dtype=torch.bfloat16,
11
+ device_map="auto"
12
  )
13
 
14
  # Define the initial system message
 
54
  messages.append({"role": "user", "content": user_input})
55
 
56
  # Prepare the input for the model
57
+ input_text = "\n".join([f"{msg['role']}: {msg['content']}" for msg in messages])
58
 
59
  # Generate a response using the pipeline
60
  try:
61
+ response = pipe(input_text, max_new_tokens=256, return_full_text=False)
 
 
62
 
63
  # Extract the assistant's response
64
+ response_content = response[0]['generated_text'].strip()
65
+
66
  # Store assistant response in the chat history
67
  messages.append({"role": "assistant", "content": response_content})
68
 
 
74
 
75
  # Gradio Interface
76
  with gr.Blocks() as demo:
77
+ gr.Markdown("## FRIDAY")
78
 
79
  # Sidebar for user inputs
80
  with gr.Row():