ldwang committed
Commit cde5d63
1 Parent(s): eb27b1a

Upload predict.py

Files changed (1): predict.py (+7, -1)
predict.py CHANGED
@@ -333,6 +333,7 @@ def predict(model, text, tokenizer=None,
             sft=True, convo_template = "",
             device = "cuda",
             model_name="AquilaChat2-7B",
+            history=[],
             **kwargs):
 
     vocab = tokenizer.get_vocab()
@@ -352,7 +353,7 @@ def predict(model, text, tokenizer=None,
         topk = 1
         temperature = 1.0
     if sft:
-        tokens = covert_prompt_to_input_ids_with_history(text, history=[], tokenizer=tokenizer, max_token=2048, convo_template=convo_template)
+        tokens = covert_prompt_to_input_ids_with_history(text, history=history, tokenizer=tokenizer, max_token=2048, convo_template=convo_template)
         tokens = torch.tensor(tokens)[None,].to(device)
     else :
         tokens = tokenizer.encode_plus(text)["input_ids"]
@@ -433,4 +434,9 @@ def predict(model, text, tokenizer=None,
 
         convert_tokens = convert_tokens[1:]
         probs = probs[1:]
+
+    # Update history
+    history.insert(0, ('USER', text))
+    history.insert(0, ('ASSISTANT', out))
+
     return out
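
This commit threads an explicit history list through predict(): the caller can now pass the running conversation, and the function prepends the latest ('USER', text) and ('ASSISTANT', out) entries to that same list before returning. A minimal multi-turn sketch of the new calling pattern, assuming model and tokenizer are already loaded for AquilaChat2-7B (the surrounding setup is illustrative, not part of this commit):

# Illustrative use of the history= keyword added in this commit.
# Assumes `model` and `tokenizer` are already loaded for AquilaChat2-7B.
history = []  # shared conversation state; newest entries end up at index 0

for question in ["What is the capital of France?", "And how large is it?"]:
    out = predict(
        model,
        question,
        tokenizer=tokenizer,
        sft=True,
        model_name="AquilaChat2-7B",
        history=history,  # new keyword; previously predict() always used history=[]
    )
    # predict() itself inserts ('USER', question) and ('ASSISTANT', out)
    # at the front of `history`, so the next call sees the whole dialogue.
    print(out)

Note that the new default history=[] is a mutable default argument, so calls that omit the keyword share one list across invocations; passing a fresh list per conversation, as above, keeps dialogues separate.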