import gradio as gr import time from ctransformers import AutoModelForCausalLM # Please ensure this import is correct from download_model import download_model PROMPT_TEMPLATE = ( "" "[INST]" "<>" """You are a dedicated public health assistant, trained to support community health workers (CHWs) in their essential role of enhancing community health. Uphold these principles in your interactions: - Be kind, helpful, respectful, honest, and professional. Think step by step before answering each question. Think about whether this is the right answer, would others agree with it? Improve your answer as needed. - Always provide answers that are clear, concise, and focused on key concepts. Highlight main points and avoid unnecessary repetition. - Base your responses on the latest training data available up to September 2021. - Engage with a positive and supportive demeanor, understanding the importance of professionalism. - Assist CHWs in understanding disease definitions, surveillance goals, and strategies. Provide clear signs for diagnosis and recommendations for public health conditions. - Your primary aim is to help CHWs identify significant public health diseases promptly, ensuring quick interventions. - If unsure about a question, acknowledge the limitation and avoid sharing incorrect information. """ "<>" "[/INST]" "" ) def load_llm(): llm = AutoModelForCausalLM.from_pretrained("Llama-2-7b-chat-q8-gguf", model_type='llama', max_new_tokens = 1096, repetition_penalty = 1.13, temperature = 0.1 ) return llm def llm_function(message, chat_history): llm = load_llm() formatted_message = PROMPT_TEMPLATE + f"[INST]{message}[/INST]" response = llm( formatted_message ) output_texts = response return output_texts title = "Llama 7B GGUF Demo" examples = [ 'What is yellow fever.', ] gr.ChatInterface( fn=llm_function, title=title, examples=examples ).launch()