Tonic commited on
Commit
d755450
·
1 Parent(s): 0d2403d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -6
app.py CHANGED
@@ -28,11 +28,10 @@ class OrcaChatBot:
28
  self.model = model
29
  self.tokenizer = tokenizer
30
  self.system_message = system_message
31
- self.conversation_history = None
32
 
33
  def predict(self, user_message, temperature=0.4, max_new_tokens=70, top_p=0.99, repetition_penalty=1.9):
34
  # Prepare the prompt
35
- prompt = f"<|im_start|>system\n{self.system_message}<|im_end|>\n<|im_start|>user\n{user_message}<|im_end|>\n<|im_start|>assistant" if self.conversation_history is None else self.conversation_history + f"<|im_end|>\n<|im_start|>user\n{user_message}<|im_end|>\n<|im_start|>assistant"
36
 
37
  # Encode the prompt
38
  inputs = self.tokenizer(prompt, return_tensors='pt', add_special_tokens=False)
@@ -48,14 +47,10 @@ class OrcaChatBot:
48
  pad_token_id=self.tokenizer.eos_token_id,
49
  do_sample=True # Enable sampling-based generation
50
  )
51
-
52
 
53
  # Decode the generated response
54
  response = self.tokenizer.decode(output_ids[0], skip_special_tokens=True)
55
 
56
- # Update conversation history
57
- self.conversation_history = self.tokenizer.decode(output_ids[0], skip_special_tokens=False)
58
-
59
  return response
60
 
61
  Orca_bot = OrcaChatBot(model, tokenizer)
 
28
  self.model = model
29
  self.tokenizer = tokenizer
30
  self.system_message = system_message
 
31
 
32
  def predict(self, user_message, temperature=0.4, max_new_tokens=70, top_p=0.99, repetition_penalty=1.9):
33
  # Prepare the prompt
34
+ prompt = f"system\n{self.system_message}\nuser\n{user_message}\nassistant"
35
 
36
  # Encode the prompt
37
  inputs = self.tokenizer(prompt, return_tensors='pt', add_special_tokens=False)
 
47
  pad_token_id=self.tokenizer.eos_token_id,
48
  do_sample=True # Enable sampling-based generation
49
  )
 
50
 
51
  # Decode the generated response
52
  response = self.tokenizer.decode(output_ids[0], skip_special_tokens=True)
53
 
 
 
 
54
  return response
55
 
56
  Orca_bot = OrcaChatBot(model, tokenizer)