Einfach.Chat

Running

File size: 1,705 Bytes

407db25
 
7742262
 
 
407db25
 
a06d5d0
407db25
ec8492c
a06d5d0
 
4b69801
77b187f
 
 
4b69801
ec8492c
 
 
4b69801
ec8492c
7dda11e
ec8492c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
de849fc
 
ec8492c
de849fc
 
 
b6df80d
de849fc
 
2235d59
de849fc
ec8492c
 
de849fc

import gradio as gr
from huggingface_hub import InferenceClient
import os



# Prefix for every prompt, read from the PROMPT_SECRET environment variable;
# the value is None when the variable is not set.
prompt_secret = os.getenv("PROMPT_SECRET")

# Inference client bound to the Mixtral instruct model.
client = InferenceClient(model="mistralai/Mixtral-8x7B-Instruct-v0.1")

def format_prompt(message, history):
    """Build the full instruct-style prompt for one chat turn.

    The prompt is the module-level ``prompt_secret`` prefix, a fixed German
    instruction sentence, every earlier exchange from ``history`` and finally
    the new ``message``.

    Args:
        message: The new user message to answer.
        history: Iterable of ``(user_prompt, bot_response)`` pairs for the
            earlier turns; ``None`` or an empty sequence means no history.

    Returns:
        The assembled prompt string.
    """
    # prompt_secret is None when PROMPT_SECRET is unset; use an empty prefix
    # instead of failing with a TypeError on string concatenation.
    system_prefix = prompt_secret or ""

    parts = [
        system_prefix,
        "In Ihrer ersten Interaktion fragen Sie nach spezifischen Anforderungen des Entwicklungsprojekts.",
    ]

    for user_prompt, bot_response in history or []:
        parts.append(f"[INST] {user_prompt} [/INST]")
        # Completed answers are closed with the end-of-sequence marker.
        parts.append(f" {bot_response}</s> ")

    # The last instruction is left open (no trailing </s>): the marker closes
    # a finished answer, and here the answer still has to be generated.
    parts.append(f"[INST] {message} [/INST]")

    return "".join(parts)


def generate(
    prompt, history, temperature=0.2, max_new_tokens=512, top_p=0.95, repetition_penalty=1.0,
):
    """Stream the model's reply to ``prompt`` as a growing string.

    Args:
        prompt: The new user message.
        history: Earlier chat turns, passed through to ``format_prompt``.
        temperature: Sampling temperature; values below 0.01 are raised to
            0.01.
        max_new_tokens: Upper bound on the number of generated tokens.
        top_p: Nucleus-sampling parameter forwarded to the endpoint.
        repetition_penalty: Repetition penalty forwarded to the endpoint.

    Yields:
        The reply text accumulated so far, once per streamed text token.

    Returns:
        The complete reply text (as the generator's return value).
    """
    # Normalise every numeric setting the same way, so values arriving as
    # strings or floats are accepted consistently.
    # NOTE(review): the 0.01 floor presumably avoids a non-positive
    # temperature being rejected by the endpoint - confirm.
    generate_kwargs = dict(
        temperature=max(float(temperature), 1e-2),
        max_new_tokens=int(max_new_tokens),
        top_p=float(top_p),
        repetition_penalty=float(repetition_penalty),
        do_sample=True,
        seed=42,  # fixed seed: identical requests sample identically
    )

    formatted_prompt = format_prompt(prompt, history)

    stream = client.text_generation(
        formatted_prompt,
        **generate_kwargs,
        stream=True,
        details=True,
        return_full_text=False,
    )
    output = ""

    for response in stream:
        token = response.token
        # Skip control tokens (e.g. the closing end-of-sequence marker) so
        # they do not show up in the visible reply.
        if getattr(token, "special", False):
            continue
        output += token.text
        yield output
    return output

# Chat display widget: custom avatar images, no label, copy and like buttons.
mychatbot = gr.Chatbot(
    avatar_images=["./user.png", "./botm.png"],
    bubble_full_width=False,
    show_label=False,
    show_copy_button=True,
    likeable=True,
)

# Chat interface that feeds each message to the streaming generate() callback.
demo = gr.ChatInterface(
    fn=generate,
    chatbot=mychatbot,
    title="Einfach Mixtral",
    retry_btn=None,
    undo_btn=None,
    theme="syddharth/gray-minimal",  # add the theme here
)

# Turn on the request queue, then start the app.
demo.queue()
demo.launch(show_api=False)