Spaces:

Ashish08
/

Falcon-40B-Instruct-Chat

Runtime error

App Files Files Community

Ashish08 commited on Jul 26, 2023

Commit

030bd8f

1 Parent(s): b1718d1

Create app.py

Browse files

Files changed (1) hide show

app.py +52 -0

app.py ADDED Viewed

	@@ -0,0 +1,52 @@

+import gradio as gr
+from transformers import pipeline
+# pipe = pipeline("text-generation", model="tiiuae/falcon-40b-instruct", trust_remote_code=True)
+def format_chat_prompt(message, chat_history, instruction):
+    prompt = f"System:{instruction}"
+    for turn in chat_history:
+        user_message, bot_message = turn
+        prompt = f"{prompt}\nUser: {user_message}\nAssistant: {bot_message}"
+    prompt = f"{prompt}\nUser: {message}\nAssistant:"
+    return prompt
+def respond(message, chat_history, instruction, temperature=0.7):
+    prompt = format_chat_prompt(message, chat_history, instruction)
+    chat_history = chat_history + [[message, ""]]
+    # stream = client.generate_stream(prompt,
+    #                                   max_new_tokens=1024,
+    #                                   stop_sequences=["\nUser:", "<|endoftext|>"],
+    #                                   temperature=temperature)
+                                      #stop_sequences to not generate the user answer
+    acc_text = ""
+    #Streaming the tokens
+    for idx, response in enumerate(stream):
+            text_token = response.token.text
+            if response.details:
+                return
+            if idx == 0 and text_token.startswith(" "):
+                text_token = text_token[1:]
+            acc_text += text_token
+            last_turn = list(chat_history.pop(-1))
+            last_turn[-1] += acc_text
+            chat_history = chat_history + [last_turn]
+            yield "", chat_history
+            acc_text = ""
+with gr.Blocks() as demo:
+    chatbot = gr.Chatbot(height=240) #just to fit the notebook
+    msg = gr.Textbox(label="Prompt")
+    with gr.Accordion(label="Advanced options",open=False):
+        system = gr.Textbox(label="System message", lines=2, value="A conversation between a user and an LLM-based AI assistant. The assistant gives helpful and honest answers.")
+        temperature = gr.Slider(label="temperature", minimum=0.1, maximum=1, value=0.7, step=0.1)
+    btn = gr.Button("Submit")
+    clear = gr.ClearButton(components=[msg, chatbot], value="Clear console")
+    btn.click(respond, inputs=[msg, chatbot, system], outputs=[msg, chatbot])
+    msg.submit(respond, inputs=[msg, chatbot, system], outputs=[msg, chatbot]) #Press enter to submit
+gr.close_all()
+demo.queue().launch(share=True, server_port=int(os.environ['PORT4']))