Spaces:
Runtime error
Runtime error
fix: workaround for ORTModel that can't access a private repository even with an auth token
Browse files
app.py
CHANGED
@@ -6,6 +6,8 @@ import torch
|
|
6 |
from transformers import AutoTokenizer, AutoModelForCausalLM
|
7 |
from optimum.onnxruntime import ORTModelForCausalLM
|
8 |
|
|
|
|
|
9 |
import gradio as gr
|
10 |
|
11 |
MODEL_NAME = (
|
@@ -15,26 +17,24 @@ MODEL_NAME = (
|
|
15 |
)
|
16 |
HF_READ_TOKEN = os.environ.get("HF_READ_TOKEN")
|
17 |
|
|
|
|
|
18 |
assert isinstance(MODEL_NAME, str)
|
19 |
|
20 |
tokenizer = AutoTokenizer.from_pretrained(
|
21 |
MODEL_NAME,
|
22 |
trust_remote_code=True,
|
23 |
-
token=HF_READ_TOKEN,
|
24 |
)
|
25 |
model = {
|
26 |
"default": AutoModelForCausalLM.from_pretrained(
|
27 |
MODEL_NAME,
|
28 |
-
token=HF_READ_TOKEN,
|
29 |
),
|
30 |
"ort": ORTModelForCausalLM.from_pretrained(
|
31 |
MODEL_NAME,
|
32 |
-
use_auth_token=HF_READ_TOKEN,
|
33 |
),
|
34 |
"ort_qantized": ORTModelForCausalLM.from_pretrained(
|
35 |
MODEL_NAME,
|
36 |
file_name="model_quantized.onnx",
|
37 |
-
use_auth_token=HF_READ_TOKEN,
|
38 |
),
|
39 |
}
|
40 |
|
@@ -676,7 +676,7 @@ def demo():
|
|
676 |
)
|
677 |
|
678 |
ui.launch(
|
679 |
-
share=True,
|
680 |
)
|
681 |
|
682 |
|
|
|
6 |
from transformers import AutoTokenizer, AutoModelForCausalLM
|
7 |
from optimum.onnxruntime import ORTModelForCausalLM
|
8 |
|
9 |
+
from huggingface_hub import login
|
10 |
+
|
11 |
import gradio as gr
|
12 |
|
13 |
MODEL_NAME = (
|
|
|
17 |
)
|
18 |
HF_READ_TOKEN = os.environ.get("HF_READ_TOKEN")
|
19 |
|
20 |
+
login(HF_READ_TOKEN)
|
21 |
+
|
22 |
assert isinstance(MODEL_NAME, str)
|
23 |
|
24 |
tokenizer = AutoTokenizer.from_pretrained(
|
25 |
MODEL_NAME,
|
26 |
trust_remote_code=True,
|
|
|
27 |
)
|
28 |
model = {
|
29 |
"default": AutoModelForCausalLM.from_pretrained(
|
30 |
MODEL_NAME,
|
|
|
31 |
),
|
32 |
"ort": ORTModelForCausalLM.from_pretrained(
|
33 |
MODEL_NAME,
|
|
|
34 |
),
|
35 |
"ort_qantized": ORTModelForCausalLM.from_pretrained(
|
36 |
MODEL_NAME,
|
37 |
file_name="model_quantized.onnx",
|
|
|
38 |
),
|
39 |
}
|
40 |
|
|
|
676 |
)
|
677 |
|
678 |
ui.launch(
|
679 |
+
# share=True,
|
680 |
)
|
681 |
|
682 |
|