Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -2,18 +2,6 @@ import os
|
|
2 |
import spaces
|
3 |
import torch
|
4 |
import gradio as gr
|
5 |
-
from huggingface_hub import snapshot_download, login
|
6 |
-
from transformers.utils import move_cache
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
11 |
-
LLM_MODEL_DIR = '/model'
|
12 |
-
LLM_MODEL_ID = "mistral-community/Mistral-7B-v0.2"
|
13 |
-
LLM_MODEL_REVISION = 'main'
|
14 |
-
os.makedirs(LLM_MODEL_DIR, exist_ok=True)
|
15 |
-
snapshot_download(LLM_MODEL_ID, revision=LLM_MODEL_REVISION, local_dir=LLM_MODEL_DIR) #, token=HF_TOKEN)
|
16 |
-
move_cache()
|
17 |
|
18 |
|
19 |
# cpu
|
@@ -28,6 +16,12 @@ print(zero.device) # <-- 'cpu' 🤔
|
|
28 |
def greet(user):
|
29 |
# print(zero.device) # <-- 'cuda:0' 🤗
|
30 |
from vllm import SamplingParams, LLM
|
|
|
|
|
|
|
|
|
|
|
|
|
31 |
|
32 |
model = LLM(LLM_MODEL_DIR)
|
33 |
sampling_params = dict(
|
|
|
2 |
import spaces
|
3 |
import torch
|
4 |
import gradio as gr
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
5 |
|
6 |
|
7 |
# cpu
|
|
|
16 |
def greet(user):
|
17 |
# print(zero.device) # <-- 'cuda:0' 🤗
|
18 |
from vllm import SamplingParams, LLM
|
19 |
+
from transformers.utils import move_cache
|
20 |
+
from huggingface_hub import snapshot_download, login
|
21 |
+
|
22 |
+
LLM_MODEL_ID = "mistral-community/Mistral-7B-v0.2"
|
23 |
+
fp = snapshot_download(LLM_MODEL_ID)
|
24 |
+
move_cache()
|
25 |
|
26 |
model = LLM(LLM_MODEL_DIR)
|
27 |
sampling_params = dict(
|