Spaces:

AtlaAI
/

judge-arena

Running

App Files Files Community

kaikaidai commited on 8 days ago

Commit

9ca1ad8

verified ·

1 Parent(s): bcd436c

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -11

app.py CHANGED Viewed

@@ -669,7 +669,10 @@ with gr.Blocks(theme="default", css=CSS_STYLES) as demo:
         ]
     )
-    # Update the submit function to handle different prompts
     def submit_and_store(
         use_reference,
         eval_criteria_text_input,
@@ -681,7 +684,7 @@ with gr.Blocks(theme="default", css=CSS_STYLES) as demo:
         score3_description,
         score4_description,
         score5_description,
-        is_first_game=False
     ):
         # Build prompt data dictionary
         prompt_data = {
@@ -698,35 +701,31 @@ with gr.Blocks(theme="default", css=CSS_STYLES) as demo:
         # Get list of active models only for matches
         active_models = [name for name, info in model_data.items()
-                        if info.get("active", True)]  # Default to True for backward compatibility
-        # Modified model selection logic
         atla_model = "Atla-8B-preview-2024-01-08"
         if is_first_game:
-            # For the first game, ensure Atla is one of the models
             other_models = [m for m in active_models if m != atla_model]
             other_model = random.choice(other_models)
-            # Randomly assign Atla to either position A or B
             if random.random() < 0.5:
                 model_a, model_b = atla_model, other_model
             else:
                 model_a, model_b = other_model, atla_model
         else:
-            # For subsequent games, Atla appears 30% of the time
             if random.random() < 0.3:
-                # Include Atla in this battle
                 other_models = [m for m in active_models if m != atla_model]
                 other_model = random.choice(other_models)
-                # Randomly assign Atla to either position A or B
                 if random.random() < 0.5:
                     model_a, model_b = atla_model, other_model
                 else:
                     model_a, model_b = other_model, atla_model
             else:
-                # Battle between two non-Atla models
                 non_atla_models = [m for m in active_models if m != atla_model]
                 model1, model2 = random.sample(non_atla_models, 2)
                 model_a, model_b = (model1, model2) if random.random() < 0.5 else (model2, model1)
@@ -786,6 +785,7 @@ with gr.Blocks(theme="default", css=CSS_STYLES) as demo:
             gr.update(value="*Model: Hidden*"),
             gr.update(value="Regenerate judges", variant="secondary", interactive=True),
             gr.update(value="🎲"),  # random_btn
         )
     # Update the click handler to use False for is_first_game after first submission
@@ -802,7 +802,7 @@ with gr.Blocks(theme="default", css=CSS_STYLES) as demo:
     # Update the send_btn click handler
     send_btn.click(
-        fn=create_submit_handler(),
         inputs=[
             use_reference_toggle,
             eval_criteria_text,
@@ -814,6 +814,7 @@ with gr.Blocks(theme="default", css=CSS_STYLES) as demo:
             score3_description,
             score4_description,
             score5_description,
         ],
         outputs=[
             score_a,
@@ -830,6 +831,7 @@ with gr.Blocks(theme="default", css=CSS_STYLES) as demo:
             model_name_b,
             send_btn,
             random_btn,
         ],
     )

         ]
     )
+    # Add a new state variable to track first game
+    first_game_state = gr.State(True)  # Initialize as True
+    # Update the submit function to use the state variable
     def submit_and_store(
         use_reference,
         eval_criteria_text_input,
         score3_description,
         score4_description,
         score5_description,
+        is_first_game,  # Add state variable as input
     ):
         # Build prompt data dictionary
         prompt_data = {
         # Get list of active models only for matches
         active_models = [name for name, info in model_data.items()
+                        if info.get("active", True)]
         atla_model = "Atla-8B-preview-2024-01-08"
         if is_first_game:
+            # For the first game, ensure new model is one of the models to catch up on votes
             other_models = [m for m in active_models if m != atla_model]
             other_model = random.choice(other_models)
+            # Randomly assign new model to either position A or B
             if random.random() < 0.5:
                 model_a, model_b = atla_model, other_model
             else:
                 model_a, model_b = other_model, atla_model
         else:
+            # For subsequent games, new model appears 30% of the time
             if random.random() < 0.3:
                 other_models = [m for m in active_models if m != atla_model]
                 other_model = random.choice(other_models)
                 if random.random() < 0.5:
                     model_a, model_b = atla_model, other_model
                 else:
                     model_a, model_b = other_model, atla_model
             else:
                 non_atla_models = [m for m in active_models if m != atla_model]
                 model1, model2 = random.sample(non_atla_models, 2)
                 model_a, model_b = (model1, model2) if random.random() < 0.5 else (model2, model1)
             gr.update(value="*Model: Hidden*"),
             gr.update(value="Regenerate judges", variant="secondary", interactive=True),
             gr.update(value="🎲"),  # random_btn
+            False,  # Set first_game_state to False after first submission
         )
     # Update the click handler to use False for is_first_game after first submission
     # Update the send_btn click handler
     send_btn.click(
+        fn=submit_and_store,
         inputs=[
             use_reference_toggle,
             eval_criteria_text,
             score3_description,
             score4_description,
             score5_description,
+            first_game_state,  # Add first_game_state as input
         ],
         outputs=[
             score_a,
             model_name_b,
             send_btn,
             random_btn,
+            first_game_state,  # Add first_game_state as output
         ],
     )