import os import streamlit as st # Install dependencies if not already installed os.system('pip install transformers torch') from transformers import AutoTokenizer, AutoModelForCausalLM # Show title and description. st.title("💬 Healthcare Chatbot") st.write( "This is a simple chatbot that uses the Llama3-Med42-8B model to generate responses. " "To use this app, simply type your question in the input field below." ) # Create a session state variable to store the chat messages. This ensures that the # messages persist across reruns. if "messages" not in st.session_state: st.session_state.messages = [] # Display the existing chat messages via `st.chat_message`. for message in st.session_state.messages: with st.chat_message(message["role"]): st.markdown(message["content"]) # Načtení modelu a tokenizeru model_name = "m42-health/Llama3-Med42-8B" tokenizer = AutoTokenizer.from_pretrained(model_name) model = AutoModelForCausalLM.from_pretrained(model_name) # Create a chat input field to allow the user to enter a message. This will display # automatically at the bottom of the page. if user_input := st.chat_input("What is up?"): # Store and display the current prompt. st.session_state.messages.append({"role": "user", "content": user_input}) with st.chat_message("user"): st.markdown(user_input) # Prepare input for the model messages = [ {"role": "system", "content": ( "You are a helpful, respectful and honest medical assistant. " "Always answer as helpfully as possible, while being safe. " "Your answers should not include any harmful, unethical, racist, sexist, toxic, dangerous, or illegal content. " "Please ensure that your responses are socially unbiased and positive in nature. " "If a question does not make any sense, or is not factually coherent, explain why instead of answering something not correct. " "If you don’t know the answer to a question, please don’t share false information." )}, {"role": "user", "content": user_input} ] input_text = " ".join([f"{message['role']}: {message['content']}" for message in messages]) input_ids = tokenizer.encode(input_text, return_tensors="pt") # Vygenerování odpovědi output_ids = model.generate(input_ids, max_length=512, do_sample=True, temperature=0.4, top_k=150, top_p=0.75) response = tokenizer.decode(output_ids[0], skip_special_tokens=True) # Display the model's response with st.chat_message("assistant"): st.markdown(response[len(input_text):]) st.session_state.messages.append({"role": "assistant", "content": response[len(input_text):]})