File size: 441 Bytes
fd33676
 
 
 
 
95866c3
 
 
1feb034
fd33676
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
import gradio as gr

import os
import subprocess

from huggingface_hub import hf_hub_download
# Fetch the quantized GGUF model file into the working directory.
# hf_hub_download returns the local path of the downloaded file, so the server
# is pointed at exactly what was fetched instead of a second hard-coded path.
model_path = hf_hub_download(
    repo_id="bartowski/gemma-2-9b-it-GGUF",
    filename="gemma-2-9b-it-Q4_K_L.gguf",
    local_dir="./",
)

# Start llama_cpp.server as a background child process.
# - Every flag and its value is a separate argv element and no shell is used:
#   with shell=True and a list, POSIX hands only "python3" to the shell as the
#   command, so the server module was never actually run.
# - Popen (rather than run) returns immediately; the server is long-lived, and
#   waiting for it to exit would keep the Gradio UI below from ever launching.
llama_server = subprocess.Popen(
    [
        "python3", "-m", "llama_cpp.server",
        "--model", model_path,
        "--host", "localhost",
        "--port", "8000",
        "--chat_format", "gemma",
    ]
)


# Placeholder UI: a Blocks app whose only component is a Markdown status line.
demo = gr.Blocks()
with demo:
    gr.Markdown("Running...")

# Serve the interface using launch()'s default settings.
demo.launch()