Spaces:

derek-thomas
/

arabic-RAG

Build error

App Files Files Community

derek-thomas HF staff committed on Nov 16, 2023

Commit

944ee1c

1 Parent(s): e5be074

Adding a better error message and a countdown.

Browse files

Files changed (1) hide show

backend/query_llm.py +28 -3

backend/query_llm.py CHANGED Viewed

@@ -1,3 +1,4 @@
 import os
 from os import getenv
@@ -19,7 +20,11 @@ def call_jais(payload):
         response.raise_for_status()  # This will raise an exception for HTTP error codes
         return response.json()
     except requests.exceptions.HTTPError as http_err:
-        raise gr.Error(f"An error occurred while processing the request. {http_err}")
     except Exception as err:
         raise gr.Error(f"Check Inference Endpoint Status. An error occurred while processing the request. {err}")
@@ -30,8 +35,14 @@ def generate(prompt: str):
     return response
 def check_endpoint_status():
-    # Replace with the actual API URL and headers
     api_url = os.getenv("ENDPOINT_URL")
     headers = {
         'accept': 'application/json',
@@ -47,6 +58,20 @@ def check_endpoint_status():
         status = data.get('status', {}).get('state', 'No status found')
         message = data.get('status', {}).get('message', 'No message found')
-        return f"Status: {status}\nMessage: {message}"
     except requests.exceptions.RequestException as e:
         return f"Failed to get status: {str(e)}"

+import datetime
 import os
 from os import getenv
         response.raise_for_status()  # This will raise an exception for HTTP error codes
         return response.json()
     except requests.exceptions.HTTPError as http_err:
+        # Check if the error is a 5XX server error
+        if 500 <= http_err.response.status_code < 600:
+            raise gr.Error("The endpoint is loading, it takes about 4 min from the first call.")
+        else:
+            raise gr.Error(f"An error occurred while processing the request. {http_err}")
     except Exception as err:
         raise gr.Error(f"Check Inference Endpoint Status. An error occurred while processing the request. {err}")
     return response
+# Global variables to store the previous status and the time when it changed
+previous_status = None
+status_change_time = None
 def check_endpoint_status():
+    global previous_status, status_change_time
     api_url = os.getenv("ENDPOINT_URL")
     headers = {
         'accept': 'application/json',
         status = data.get('status', {}).get('state', 'No status found')
         message = data.get('status', {}).get('message', 'No message found')
+        # Check if the status has changed
+        if status != previous_status:
+            previous_status = status
+            status_change_time = datetime.datetime.now()
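+        # Intent: if the previous status was 'scaled to zero' and the current one isn't, start the countdown.
+        # NOTE(review): previous_status was already set to status just above, so this condition looks unreachable.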
+        countdown_message = ""
+        if status_change_time and previous_status == "scaled to zero" and status != "scaled to zero":
+            elapsed_time = datetime.datetime.now() - status_change_time
+            if elapsed_time < datetime.timedelta(minutes=4):
+                remaining_time = datetime.timedelta(minutes=4) - elapsed_time
+                countdown_message = f"Countdown: {remaining_time} remaining until fully operational."
+        return f"Status: {status}\nMessage: {message}\n{countdown_message}"
     except requests.exceptions.RequestException as e:
         return f"Failed to get status: {str(e)}"