Further clean up + extending the max_steps now that it seems to be working again.
Browse files
app.py
CHANGED
@@ -10,7 +10,7 @@ from Gradio_UI import GradioUI
|
|
10 |
|
11 |
verbose = True
|
12 |
|
13 |
-
if verbose: print("Running app.py
|
14 |
|
15 |
# Below is an example of a tool that does nothing. Amaze us with your creativity !
|
16 |
@tool
|
@@ -82,10 +82,8 @@ def get_current_time_in_timezone(timezone: str) -> str:
|
|
82 |
|
83 |
final_answer = FinalAnswerTool()
|
84 |
|
85 |
-
if verbose: print("Defining MODEL_IDS.\n")
|
86 |
-
|
87 |
MODEL_IDS = [
|
88 |
-
'https://wxknx1kg971u7k1n.us-east-1.aws.endpoints.huggingface.cloud/',
|
89 |
'https://jc26mwg228mkj8dw.us-east-1.aws.endpoints.huggingface.cloud/',
|
90 |
'meta-llama/Llama-3.2-1B-Instruct',
|
91 |
'Qwen/Qwen2.5-Coder-32B-Instruct',
|
@@ -97,6 +95,8 @@ def is_model_overloaded(model_url):
|
|
97 |
"""Verify if the model is overloaded doing a test call."""
|
98 |
try:
|
99 |
response = requests.post(model_url, json={"inputs": "Test"})
|
|
|
|
|
100 |
if response.status_code == 503: # 503 Service Unavailable = Overloaded
|
101 |
return True
|
102 |
if response.status_code == 404: # 404 Client Error: Not Found
|
@@ -108,12 +108,12 @@ def is_model_overloaded(model_url):
|
|
108 |
def get_available_model():
|
109 |
"""Select the first model available from the list."""
|
110 |
for model_url in MODEL_IDS:
|
111 |
-
print("
|
112 |
if not is_model_overloaded(model_url):
|
113 |
return model_url
|
114 |
return MODEL_IDS[0] # if all are failing, use the first model by dfault
|
115 |
|
116 |
-
if verbose: print("Checking available models
|
117 |
|
118 |
selected_model_id = get_available_model()
|
119 |
|
@@ -136,7 +136,7 @@ with open("prompts.yaml", 'r') as stream:
|
|
136 |
agent = CodeAgent(
|
137 |
model=model,
|
138 |
tools=[final_answer, get_current_time_in_timezone, image_generation_tool, toss_a_die, nse_stock_price_tool], ## add your tools here (don't remove final answer)
|
139 |
-
max_steps=
|
140 |
verbosity_level=1,
|
141 |
grammar=None,
|
142 |
planning_interval=None,
|
|
|
10 |
|
11 |
verbose = True
|
12 |
|
13 |
+
if verbose: print("Running app.py")
|
14 |
|
15 |
# Below is an example of a tool that does nothing. Amaze us with your creativity !
|
16 |
@tool
|
|
|
82 |
|
83 |
final_answer = FinalAnswerTool()
|
84 |
|
|
|
|
|
85 |
MODEL_IDS = [
|
86 |
+
#'https://wxknx1kg971u7k1n.us-east-1.aws.endpoints.huggingface.cloud/',
|
87 |
'https://jc26mwg228mkj8dw.us-east-1.aws.endpoints.huggingface.cloud/',
|
88 |
'meta-llama/Llama-3.2-1B-Instruct',
|
89 |
'Qwen/Qwen2.5-Coder-32B-Instruct',
|
|
|
95 |
"""Verify if the model is overloaded doing a test call."""
|
96 |
try:
|
97 |
response = requests.post(model_url, json={"inputs": "Test"})
|
98 |
+
if verbose:
|
99 |
+
print(response.status_code)
|
100 |
if response.status_code == 503: # 503 Service Unavailable = Overloaded
|
101 |
return True
|
102 |
if response.status_code == 404: # 404 Client Error: Not Found
|
|
|
108 |
def get_available_model():
    """Select the first available model from the list.

    Tries each endpoint/model id in MODEL_IDS in order and returns the
    first one whose test call reports it is not overloaded.

    Returns:
        str: the first responsive entry of MODEL_IDS, or MODEL_IDS[0]
        as a fallback when every candidate fails the availability check.
    """
    for model_url in MODEL_IDS:
        # Gate progress output on the module-level `verbose` flag, matching
        # the diagnostic-print convention used everywhere else in this file.
        if verbose:
            print("trying", model_url)
        if not is_model_overloaded(model_url):
            return model_url
    return MODEL_IDS[0]  # if all are failing, use the first model by default
|
115 |
|
116 |
+
if verbose: print("Checking available models.")
|
117 |
|
118 |
selected_model_id = get_available_model()
|
119 |
|
|
|
136 |
agent = CodeAgent(
|
137 |
model=model,
|
138 |
tools=[final_answer, get_current_time_in_timezone, image_generation_tool, toss_a_die, nse_stock_price_tool], ## add your tools here (don't remove final answer)
|
139 |
+
max_steps=6,
|
140 |
verbosity_level=1,
|
141 |
grammar=None,
|
142 |
planning_interval=None,
|