wizardlm-13b-v1-2-q4-0-gguf

Paused

AFischer1985 committed on Dec 21, 2023

Commit

5ff6775

1 Parent(s): b636de7

Update main.py

Files changed (1) hide show

main.py CHANGED Viewed

@@ -1,23 +1,4 @@
-from llama_cpp.server.app import create_app, Settings
-from fastapi.responses import HTMLResponse
-import os
-app = create_app(
-    Settings(
-        n_threads=2,  # set to number of cpu cores
-        model="model/gguf-model.bin",
-        embedding=False
-    )
-)
-# Read the content of index.html once and store it in memory
-with open("index.html", "r") as f:
-    content = f.read()
-@app.get("/", response_class=HTMLResponse)
-async def read_items():
-    return content
-import uvicorn
-uvicorn.run(app, host=os.environ["HOST"], port=int(os.environ["PORT"]))

+import subprocess
+command = ["python3", "-m", "llama_cpp.server", "--model", "model/gguf-model.bin", "--host", "0.0.0.0", "--port", "2600"]
+subprocess.Popen(command)