samunder12 committed on
Commit
3dce9ee
·
verified ·
1 Parent(s): 233b050
Files changed (1) hide show
  1. app.py +5 -6
app.py CHANGED
@@ -1,8 +1,7 @@
1
  import gradio as gr
2
- from transformers import pipeline
3
 
4
- # Load the model
5
- pipe = pipeline("text-generation", model="KoboldAI/fairseq-dense-13B-Shinen")
6
 
7
  def respond(
8
  message,
@@ -19,13 +18,13 @@ def respond(
19
  prompt += f"Human: {message}\nAI:"
20
 
21
  # Generate response
22
- response = pipe(
23
  prompt,
24
- max_length=len(prompt.split()) + max_tokens,
25
  temperature=temperature,
26
  top_p=top_p,
27
  do_sample=True,
28
- )[0]['generated_text']
29
 
30
  # Extract only the AI's response
31
  ai_response = response.split("AI:")[-1].strip()
 
1
  import gradio as gr
2
+ from huggingface_hub import InferenceClient
3
 
4
+ client = InferenceClient("KoboldAI/fairseq-dense-13B-Shinen")
 
5
 
6
  def respond(
7
  message,
 
18
  prompt += f"Human: {message}\nAI:"
19
 
20
  # Generate response
21
+ response = client.text_generation(
22
  prompt,
23
+ max_new_tokens=max_tokens,
24
  temperature=temperature,
25
  top_p=top_p,
26
  do_sample=True,
27
+ )
28
 
29
  # Extract only the AI's response
30
  ai_response = response.split("AI:")[-1].strip()