Spaces:
Running
on
Zero
Running
on
Zero
BramVanroy
committed on
Commit
•
a34b903
1
Parent(s):
70b3775
Update app.py
Browse files
app.py
CHANGED
@@ -15,7 +15,7 @@ MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "8192"))
|
|
15 |
|
16 |
if torch.cuda.is_available():
|
17 |
model_id = "BramVanroy/GEITje-ultra"
|
18 |
-
model = AutoModelForCausalLM.from_pretrained(model_id,
|
19 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
20 |
|
21 |
|
@@ -80,14 +80,14 @@ chat_interface = gr.ChatInterface(
|
|
80 |
minimum=0.05,
|
81 |
maximum=2,
|
82 |
step=0.05,
|
83 |
-
value=0
|
84 |
),
|
85 |
gr.Slider(
|
86 |
label="Top-p (nucleus sampling)",
|
87 |
minimum=0.05,
|
88 |
maximum=1.0,
|
89 |
step=0.05,
|
90 |
-
value=0
|
91 |
),
|
92 |
gr.Slider(
|
93 |
label="Top-k",
|
|
|
15 |
|
16 |
if torch.cuda.is_available():
|
17 |
model_id = "BramVanroy/GEITje-ultra"
|
18 |
+
model = AutoModelForCausalLM.from_pretrained(model_id, load_in_8bit=True, device_map="auto")
|
19 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
20 |
|
21 |
|
|
|
80 |
minimum=0.05,
|
81 |
maximum=2,
|
82 |
step=0.05,
|
83 |
+
value=1.0,
|
84 |
),
|
85 |
gr.Slider(
|
86 |
label="Top-p (nucleus sampling)",
|
87 |
minimum=0.05,
|
88 |
maximum=1.0,
|
89 |
step=0.05,
|
90 |
+
value=1.0,
|
91 |
),
|
92 |
gr.Slider(
|
93 |
label="Top-k",
|