BramVanroy committed on
Commit
a34b903
1 Parent(s): 70b3775

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -15,7 +15,7 @@ MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "8192"))
15
 
16
  if torch.cuda.is_available():
17
  model_id = "BramVanroy/GEITje-ultra"
18
- model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.float16, device_map="auto")
19
  tokenizer = AutoTokenizer.from_pretrained(model_id)
20
 
21
 
@@ -80,14 +80,14 @@ chat_interface = gr.ChatInterface(
80
  minimum=0.05,
81
  maximum=2,
82
  step=0.05,
83
- value=0.2,
84
  ),
85
  gr.Slider(
86
  label="Top-p (nucleus sampling)",
87
  minimum=0.05,
88
  maximum=1.0,
89
  step=0.05,
90
- value=0.9,
91
  ),
92
  gr.Slider(
93
  label="Top-k",
 
15
 
16
  if torch.cuda.is_available():
17
  model_id = "BramVanroy/GEITje-ultra"
18
+ model = AutoModelForCausalLM.from_pretrained(model_id, load_in_8bit=True, device_map="auto")
19
  tokenizer = AutoTokenizer.from_pretrained(model_id)
20
 
21
 
 
80
  minimum=0.05,
81
  maximum=2,
82
  step=0.05,
83
+ value=1.0,
84
  ),
85
  gr.Slider(
86
  label="Top-p (nucleus sampling)",
87
  minimum=0.05,
88
  maximum=1.0,
89
  step=0.05,
90
+ value=1.0,
91
  ),
92
  gr.Slider(
93
  label="Top-k",