Spaces:
Paused
Paused
Update app.py
Browse files
app.py
CHANGED
@@ -26,13 +26,19 @@ def load_model(model_name):
|
|
26 |
global model, tokenizer
|
27 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
28 |
model = AutoModelForCausalLM.from_pretrained(model_name, device_map="cpu", attn_implementation="eager")
|
|
|
|
|
|
|
|
|
|
|
|
|
29 |
return f"Modèle {model_name} chargé avec succès sur CPU."
|
30 |
|
31 |
@spaces.GPU(duration=300)
|
32 |
def generate_text(input_text, temperature, top_p, top_k):
|
33 |
global model, tokenizer
|
34 |
|
35 |
-
inputs = tokenizer(input_text, return_tensors="pt", padding=True)
|
36 |
input_ids = inputs["input_ids"]
|
37 |
attention_mask = inputs["attention_mask"]
|
38 |
|
|
|
26 |
global model, tokenizer
|
27 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
28 |
model = AutoModelForCausalLM.from_pretrained(model_name, device_map="cpu", attn_implementation="eager")
|
29 |
+
|
30 |
+
# Définir le token de padding s'il n'existe pas
|
31 |
+
if tokenizer.pad_token is None:
|
32 |
+
tokenizer.pad_token = tokenizer.eos_token
|
33 |
+
model.config.pad_token_id = model.config.eos_token_id
|
34 |
+
|
35 |
return f"Modèle {model_name} chargé avec succès sur CPU."
|
36 |
|
37 |
@spaces.GPU(duration=300)
|
38 |
def generate_text(input_text, temperature, top_p, top_k):
|
39 |
global model, tokenizer
|
40 |
|
41 |
+
inputs = tokenizer(input_text, return_tensors="pt", padding=True, truncation=True, max_length=512)
|
42 |
input_ids = inputs["input_ids"]
|
43 |
attention_mask = inputs["attention_mask"]
|
44 |
|