Spaces:

Futuresony
/

FuturesonyAi

Running

App Files Files Community

Futuresony committed on Feb 5

Commit

669f0b6

verified ·

1 Parent(s): 3d06565

Update app.py

Browse files

Files changed (1) hide show

app.py +31 -13

app.py CHANGED Viewed

@@ -1,11 +1,22 @@
 import gradio as gr
 from huggingface_hub import InferenceClient
-"""
-For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
-"""
 client = InferenceClient("Futuresony/future_ai_12_10_2024.gguf")
 def respond(
     message,
@@ -26,23 +37,30 @@ def respond(
     messages.append({"role": "user", "content": message})
     response = ""
-    for message in client.chat_completion(
         messages,
         max_tokens=max_tokens,
-        stream=True,
         temperature=temperature,
         top_p=top_p,
-    ):
-        token = message.choices[0].delta.content
         response += token
-        yield response
-"""
-For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
-"""
 demo = gr.ChatInterface(
     respond,
     additional_inputs=[
@@ -59,6 +77,6 @@ demo = gr.ChatInterface(
     ],
 )
 if __name__ == "__main__":
     demo.launch()

 import gradio as gr
 from huggingface_hub import InferenceClient
+from web import search  # Web search for fetching real-time answers
 client = InferenceClient("Futuresony/future_ai_12_10_2024.gguf")
+# Define topics that your model was NOT fine-tuned on
+OUT_OF_SCOPE_TOPICS = ["current events", "latest news", "sports scores", "politics", "celebrity gossip"]
+def is_out_of_scope(question):
+    """Check if the question relates to topics the model wasn't trained on."""
+    return any(topic in question.lower() for topic in OUT_OF_SCOPE_TOPICS)
+def google_search(query):
+    """Fetch search results from Google."""
+    results = search(query)
+    if results:
+        return results[0]  # Return the first result
+    return "Sorry, I couldn't find an answer on Google."
 def respond(
     message,
     messages.append({"role": "user", "content": message})
     response = ""
+    response_obj = client.chat_completion(
         messages,
         max_tokens=max_tokens,
         temperature=temperature,
         top_p=top_p,
+        logprobs=True,  # Get log probabilities to measure uncertainty
+    )
+    # Extract response text
+    for message in response_obj:
+        token = message.choices[0].delta.content
         response += token
+        yield response  # Stream response
+    # Analyze uncertainty (using log probabilities)
+    logprobs = response_obj.choices[0].logprobs.token_logprobs
+    avg_confidence = sum(logprobs) / len(logprobs) if logprobs else 0
+    # If confidence is low OR the question is about out-of-scope topics, use Google
+    if avg_confidence < -5 or is_out_of_scope(message):
+        google_response = google_search(message)
+        yield f"🤖 AI (Low confidence): {response}\n\n🌍 Google: {google_response}"
 demo = gr.ChatInterface(
     respond,
     additional_inputs=[
     ],
 )
 if __name__ == "__main__":
     demo.launch()