import gradio as gr
from transformers import pipeline, set_seed
import os


api_key = os.environ.get("LLama2Secret")
# Your Hugging Face API key


# Initialize the pipeline with the LLaMA 2-7B chat model
model_name = "meta-llama/Llama-2-7b-chat"
# model_name = "meta-llama/Llama-2-7b-chat"
chat_model = pipeline("text2text-generation", model=model_name, use_auth_token=api_key)

def ask_llama2(question):
    set_seed(42)
    responses = chat_model(question, max_length=50)
    return responses[0]['generated_text']

iface = gr.Interface(fn=ask_llama2, inputs="text", outputs="text", title="Chat with LLaMA 2")

iface.launch()