Carlos Rosas committed on
Commit
3db8a39
·
verified ·
1 Parent(s): aa81522

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -10
app.py CHANGED
@@ -13,14 +13,6 @@ import pandas as pd
13
  # Define the device
14
  device = "cuda" if torch.cuda.is_available() else "cpu"
15
 
16
- # Define variables
17
- temperature = 0.0
18
- max_new_tokens = 1500
19
- top_p = 0.95
20
- repetition_penalty = 1.0
21
- min_new_tokens = 800
22
- early_stopping = False
23
-
24
  model_name = "PleIAs/Pleias-Rag"
25
 
26
  # Get Hugging Face token from environment variable
@@ -34,9 +26,19 @@ model = AutoModelForCausalLM.from_pretrained(model_name, token=hf_token)
34
  model.to(device)
35
 
36
  # Set tokenizer configuration
37
- tokenizer.pad_token = tokenizer.eos_token
38
- tokenizer.pad_token_id = tokenizer.eos_token_id
39
  tokenizer.eos_token = "<|answer_end|>"
 
 
 
 
 
 
 
 
 
 
 
40
 
41
  # Connect to the LanceDB database
42
  db = lancedb.connect("content 5/lancedb_data")
 
13
  # Define the device
14
  device = "cuda" if torch.cuda.is_available() else "cpu"
15
 
 
 
 
 
 
 
 
 
16
  model_name = "PleIAs/Pleias-Rag"
17
 
18
  # Get Hugging Face token from environment variable
 
26
  model.to(device)
27
 
28
  # Set tokenizer configuration
29
+
 
30
  tokenizer.eos_token = "<|answer_end|>"
31
+ eos_token_id=tokenizer.eos_token_id
32
+ tokenizer.pad_token = tokenizer.eos_token
33
+ tokenizer.pad_token_id = 1
34
+
35
+ # Define variables
36
+ temperature = 0.0
37
+ max_new_tokens = 1500
38
+ top_p = 0.95
39
+ repetition_penalty = 1.0
40
+ min_new_tokens = 800
41
+ early_stopping = False
42
 
43
  # Connect to the LanceDB database
44
  db = lancedb.connect("content 5/lancedb_data")