project-baize committed on
Commit e0ec530
1 Parent(s): 9d96329

Update app.py

Files changed (1): app.py (+6, -5)
app.py CHANGED
@@ -35,14 +35,14 @@ def predict(text,
         return
 
     inputs = generate_prompt_with_history(text,history,tokenizer,max_length=max_context_length_tokens)
-    if inputs is False:
-        yield chatbot+[[text,"Sorry, the input is too long."]],history,"Generate Fail"
-        return
+    if inputs is None:
+        yield chatbot,history,"Too Long Input"
+        return
     else:
         prompt,inputs=inputs
         begin_length = len(prompt)
+    input_ids = inputs["input_ids"][:,-max_context_length_tokens:].to(device)
     torch.cuda.empty_cache()
-    input_ids = inputs["input_ids"].to(device)
     global total_count
     total_count += 1
     print(total_count)
@@ -63,6 +63,7 @@ def predict(text,
                 return
             except:
                 pass
+    torch.cuda.empty_cache()
     #print(text)
     #print(x)
     #print("="*80)
@@ -150,7 +151,7 @@ with gr.Blocks(css=customCSS, theme=small_and_beautiful_theme) as demo:
             )
             max_context_length_tokens = gr.Slider(
                 minimum=0,
-                maximum=4096,
+                maximum=3072,
                 value=2048,
                 step=128,
                 interactive=True,
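
For context, a minimal sketch of what the new guard and truncation in this commit do, using stand-in values; predict(), generate_prompt_with_history(), the real tokenizer, and device come from app.py and are not reproduced here, so the shapes and token ids below are illustrative only.

import torch

max_context_length_tokens = 2048  # matches the slider default above

# Hypothetical over-long prompt: 5000 token ids for a single batch element.
input_ids = torch.randint(0, 32000, (1, 5000))

# New behavior from this commit: keep only the last max_context_length_tokens
# tokens, so the most recent conversation turns survive the cut.
truncated = input_ids[:, -max_context_length_tokens:]
print(truncated.shape)  # torch.Size([1, 2048])

# New guard: the prompt builder's result is now checked against None (instead
# of False) before unpacking, and the UI status string becomes "Too Long Input".
inputs = None  # stand-in for a history that could not be fit into the context
if inputs is None:
    print("Too Long Input")
else:
    prompt, inputs = inputs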