Spaces:

Ahren09
/

AgentReview

Running

App Files Files Community

USTC975 committed on Nov 6, 2024

Commit

a06e98d

1 Parent(s): 1d838f0

build gradio app

Browse files

Files changed (8) hide show

agentreview/backends/openai.py +1 -0
agentreview/environments/paper_review.py +3 -6
agentreview/paper_review_arena.py +1 -0
agentreview/paper_review_message.py +1 -2
agentreview/paper_review_player.py +16 -5
agentreview/utility/authentication_utils.py +7 -7
app.py +610 -4
template.py +576 -0

agentreview/backends/openai.py CHANGED Viewed

@@ -64,6 +64,7 @@ class OpenAIChat(IntelligenceBackend):
     def _get_response(self, messages):
         # Refer to https://learn.microsoft.com/en-us/azure/ai-services/openai/how-to/switching-endpoints for how to
         # make API calls
         if self.client_type == "openai":
             completion = self.client.chat.completions.create(

     def _get_response(self, messages):
         # Refer to https://learn.microsoft.com/en-us/azure/ai-services/openai/how-to/switching-endpoints for how to
         # make API calls
+        return 'hello'  # FIXME: remove this line
         if self.client_type == "openai":
             completion = self.client.chat.completions.create(

agentreview/environments/paper_review.py CHANGED Viewed

@@ -57,7 +57,7 @@ class PaperReview(Conversation):
         if self._phases is not None:
             return self._phases
         reviewer_names = [name for name in self.player_names if name.startswith("Reviewer")]
         num_reviewers = len(reviewer_names)
@@ -180,13 +180,10 @@ class PaperReview(Conversation):
                            "Phase V. (AC makes decisions).")
             else:
-                logger.info(f"Phase {self.phase_index}: end of the speaking order. Move to Phase ({self.phase_index + 1}).")
                 self.phase_index += 1
                 self._current_turn += 1
         else:
             self._next_player_index += 1
@@ -200,7 +197,7 @@ class PaperReview(Conversation):
     def get_next_player(self) -> str:
         """Get the next player in the current phase."""
-        speaking_order = self.phases[self.phase_index]["speaking_order"]
         next_player = speaking_order[self._next_player_index]
         return next_player

         if self._phases is not None:
             return self._phases
         reviewer_names = [name for name in self.player_names if name.startswith("Reviewer")]
         num_reviewers = len(reviewer_names)
                            "Phase V. (AC makes decisions).")
             else:
+                print(f"Phase {self.phase_index}: end of the speaking order. Move to Phase ({self.phase_index + 1}).")
                 self.phase_index += 1
                 self._current_turn += 1
         else:
             self._next_player_index += 1
     def get_next_player(self) -> str:
         """Get the next player in the current phase."""
+        speaking_order = self.phases[self.phase_index]["speaking_order"]
         next_player = speaking_order[self._next_player_index]
         return next_player

agentreview/paper_review_arena.py CHANGED Viewed

@@ -101,6 +101,7 @@ class PaperReviewArena(Arena):
                 player.role_desc = get_reviewer_description(phase="reviewer_ac_discussion",
                                                             **self.environment.experiment_setting["players"][
                                                                 'Reviewer'][reviewer_index - 1])
             elif self.environment.phase_index == 5:  # Phase 5 AC Makes Decisions

                 player.role_desc = get_reviewer_description(phase="reviewer_ac_discussion",
                                                             **self.environment.experiment_setting["players"][
                                                                 'Reviewer'][reviewer_index - 1])
             elif self.environment.phase_index == 5:  # Phase 5 AC Makes Decisions

agentreview/paper_review_message.py CHANGED Viewed

@@ -60,7 +60,7 @@ class PaperReviewMessagePool(MessagePool):
                 visible_messages = []
         elif phase_index == 4:
-            if agent_name.startswith("AC"):
                 area_chair_type = self.experiment_setting['players']['AC'][0]["area_chair_type"]
                 # 'BASELINE' means we do not specify the area chair's characteristics in the config file
@@ -86,7 +86,6 @@ class PaperReviewMessagePool(MessagePool):
                 else:
                     raise ValueError(f"Unknown Area chair type: {area_chair_type}.")
         else:
             visible_messages = []

                 visible_messages = []
         elif phase_index == 4:
+            if agent_name.startswith("AC"):
                 area_chair_type = self.experiment_setting['players']['AC'][0]["area_chair_type"]
                 # 'BASELINE' means we do not specify the area chair's characteristics in the config file
                 else:
                     raise ValueError(f"Unknown Area chair type: {area_chair_type}.")
         else:
             visible_messages = []

agentreview/paper_review_player.py CHANGED Viewed

@@ -78,6 +78,7 @@ class PaperExtractorPlayer(Player):
             paper_decision: str,
             conference: str,
             backend: Union[BackendConfig, IntelligenceBackend],
             global_prompt: str = None,
             **kwargs,
     ):
@@ -85,6 +86,9 @@ class PaperExtractorPlayer(Player):
         self.paper_id = paper_id
         self.paper_decision = paper_decision
         self.conference: str = conference
     def act(self, observation: List[Message]) -> str:
         """
@@ -96,12 +100,17 @@ class PaperExtractorPlayer(Player):
         Returns:
             str: The action (response) of the player.
         """
-        logging.info(f"Loading {self.conference} paper {self.paper_id} ({self.paper_decision}) ...")
         loader = PDFReader()
-        document_path = Path(os.path.join(self.args.data_dir, self.conference, "paper", self.paper_decision,
-                                          f"{self.paper_id}.pdf"))  #
         documents = loader.load_data(file=document_path)
         num_words = 0
@@ -118,5 +127,7 @@ class PaperExtractorPlayer(Player):
             main_contents += text + ' '
             if FLAG:
                 break
         return main_contents

             paper_decision: str,
             conference: str,
             backend: Union[BackendConfig, IntelligenceBackend],
+            paper_pdf_path: str = None,
             global_prompt: str = None,
             **kwargs,
     ):
         self.paper_id = paper_id
         self.paper_decision = paper_decision
         self.conference: str = conference
+        if paper_pdf_path is not None:
+            self.paper_pdf_path = paper_pdf_path
     def act(self, observation: List[Message]) -> str:
         """
         Returns:
             str: The action (response) of the player.
         """
+        if self.paper_pdf_path is not None:
+            logging.info(f"Loading paper from {self.paper_pdf_path} ...")
+        else:
+            logging.info(f"Loading {self.conference} paper {self.paper_id} ({self.paper_decision}) ...")
         loader = PDFReader()
+        if self.paper_pdf_path is not None:
+            document_path = Path(self.paper_pdf_path)
+        else:
+            document_path = Path(os.path.join(self.args.data_dir, self.conference, "paper", self.paper_decision,
+                                            f"{self.paper_id}.pdf"))  #
         documents = loader.load_data(file=document_path)
         num_words = 0
             main_contents += text + ' '
             if FLAG:
                 break
+        print(main_contents)
         return main_contents

agentreview/utility/authentication_utils.py CHANGED Viewed

@@ -16,13 +16,6 @@ def get_openai_client(client_type: str):
     assert client_type in ["azure_openai", "openai"]
-    endpoint: str = os.environ['AZURE_ENDPOINT']
-    if not endpoint.startswith("https://"):
-        endpoint = f"https://{endpoint}.openai.azure.com"
-    os.environ['AZURE_ENDPOINT'] = endpoint
     if not os.environ.get('OPENAI_API_VERSION'):
         os.environ['OPENAI_API_VERSION'] = "2023-05-15"
@@ -32,6 +25,13 @@ def get_openai_client(client_type: str):
         )
     elif client_type == "azure_openai":
         client = openai.AzureOpenAI(
             api_key=os.environ['AZURE_OPENAI_KEY'],
             azure_endpoint=os.environ['AZURE_ENDPOINT'],  # f"https://YOUR_END_POINT.openai.azure.com"

     assert client_type in ["azure_openai", "openai"]
     if not os.environ.get('OPENAI_API_VERSION'):
         os.environ['OPENAI_API_VERSION'] = "2023-05-15"
         )
     elif client_type == "azure_openai":
+        endpoint: str = os.environ['AZURE_ENDPOINT']
+        if not endpoint.startswith("https://"):
+            endpoint = f"https://{endpoint}.openai.azure.com"
+        os.environ['AZURE_ENDPOINT'] = endpoint
         client = openai.AzureOpenAI(
             api_key=os.environ['AZURE_OPENAI_KEY'],
             azure_endpoint=os.environ['AZURE_ENDPOINT'],  # f"https://YOUR_END_POINT.openai.azure.com"

app.py CHANGED Viewed

@@ -1,7 +1,613 @@
 import gradio as gr
-def echo_text(text):
-    return text
-iface = gr.Interface(fn=echo_text, inputs="text", outputs="text")
-iface.launch()

+import json
+import re
+from glob import glob
+from argparse import Namespace
 import gradio as gr
+from agentreview import const
+from agentreview.config import AgentConfig
+from agentreview.agent import Player
+from agentreview.backends import BACKEND_REGISTRY
+from agentreview.environments import PaperReview
+from agentreview.paper_review_arena import PaperReviewArena
+from agentreview.utility.experiment_utils import initialize_players
+from agentreview.paper_review_player import PaperExtractorPlayer, AreaChair, Reviewer
+from agentreview.role_descriptions import get_reviewer_description, get_ac_description, get_author_config, get_paper_extractor_config
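+# This file handles the front-end interaction: it builds the page, reads the user's configuration from it, passes that configuration to the back end, and shows the results in the corresponding components in real time.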
+css = """#col-container {max-width: 90%; margin-left: auto; margin-right: auto; display: flex; flex-direction: column;}
+#header {text-align: center;}
+#col-chatbox {flex: 1; max-height: min(900px, 100%);}
+#label {font-size: 2em; padding: 0.5em; margin: 0;}
+.message {font-size: 1.2em;}
+.message-wrap {max-height: min(700px, 100vh);}
+"""
+# .wrap {min-width: min(640px, 100vh)}
+# #env-desc {max-height: 100px; overflow-y: auto;}
+# .textarea {height: 100px; max-height: 100px;}
+# #chatbot-tab-all {height: 750px; max-height: min(750px, 100%);}
+# #chatbox {height: min(750px, 100%); max-height: min(750px, 100%);}
+# #chatbox.block {height: 730px}
+# .wrap {max-height: 680px;}
+# .scroll-hide {overflow-y: scroll; max-height: 100px;}
+DEBUG = False
+DEFAULT_BACKEND = "openai-chat"
+MAX_NUM_PLAYERS = 4
+DEFAULT_NUM_PLAYERS = 4
+CURRENT_STEP_INDEX = 0
+def load_examples():
+    example_configs = {}
+    # Load json config files from examples folder
+    example_files = glob("examples/*.json")
+    for example_file in example_files:
+        with open(example_file, encoding="utf-8") as f:
+            example = json.load(f)
+            try:
+                example_configs[example["name"]] = example
+            except KeyError:
+                print(f"Example {example_file} is missing a name field. Skipping.")
+    return example_configs
+EXAMPLE_REGISTRY = load_examples()
+# DB = SupabaseDB() if supabase_available else None
+def get_player_components(name, visible):
+    """Build the configuration widgets for one reviewer tab.
+
+    The left column holds a hidden textbox carrying ``name``, three dropdowns
+    (intention, knowledgeability, responsibility) and a role-description
+    textbox that is regenerated whenever one of the dropdowns is selected.
+    The right column holds the backend selector and an accordion with the
+    temperature / max-token sliders.
+
+    Args:
+        name: Player name; stored in the hidden ``role_name`` textbox and used
+            in the accordion title.
+        visible: Visibility applied to the role description, the backend
+            selector, the accordion and both sliders.
+
+    Returns:
+        list: ``[role_name, Intention_config, Knowledge_config,
+        Responsibility_config, backend_type, accordion, temperature,
+        max_tokens]``.  The role-description textbox is not part of the list.
+    """
+    with gr.Row():
+        with gr.Column():
+            # Hidden field: only carries the player name to the event handlers.
+            role_name = gr.Textbox(
+                lines=1,
+                show_label=False,
+                interactive=True,
+                visible=False,
+                value=name,
+            )
+            # is benign, is_knowledgeable, is_responsible,
+            # player_config = gr.CheckboxGroup(
+            #     choices=["Benign", "Knowledgeable", "Responsible"],
+            #     label="Reviewer Type",
+            #     visible=visible,
+            # )
+            with gr.Row():
+            # Expose the three reviewer attributes as dropdowns
+                Intention_config = gr.Dropdown(
+                    choices=["Benign", "Malicious", "Neutral"],
+                    interactive=True,
+                    label = "Intention",
+                    show_label=True,
+                    value="Neutral",
+                )
+                Knowledge_config = gr.Dropdown(
+                    choices=["Knowledgeable", "Unknownledgeable", "Normal"],
+                    interactive=True,
+                    label = "Knowledgeability",
+                    show_label=True,
+                    value="Normal",
+                )
+                Responsibility_config = gr.Dropdown(
+                    choices=["Responsible", "Lazy", "Normal"],
+                    interactive=True,
+                    label = "Responsibility",
+                    show_label=True,
+                    value="Normal",
+                )
+            role_desc = gr.Textbox(
+                lines=8,
+                max_lines=8,
+                show_label=False,
+                interactive=True,
+                visible=visible,
+                autoscroll=False,
+                value=get_reviewer_description()
+            )
+            # role_desc = gr.Markdown(value=get_reviewer_description(),
+            #                         visible=visible)
+            def update_role_desc(Intention_config, Knowledge_config, Responsibility_config):
+                """Regenerate the reviewer description from the three dropdown values."""
+                # Each dropdown maps to True / False / None; None is used for the
+                # middle choice ("Neutral" or "Normal").
+                is_benign = True if Intention_config == "Benign" else (False if Intention_config == "Malicious" else None)
+                is_knowledgeable = True if Knowledge_config == "Knowledgeable" else (False if Knowledge_config == "Unknownledgeable" else None)
+                is_responsible = True if Responsibility_config == "Responsible" else (False if Responsibility_config == "Lazy" else None)
+                # The phase is derived from the module-level CURRENT_STEP_INDEX.
+                phase = 'reviewer_write_reviews' if CURRENT_STEP_INDEX < 2 else 'reviewer_ac_discussion'
+                return get_reviewer_description(is_benign, is_knowledgeable, is_responsible, phase=phase)  # FIXME: should vary with the current phase
+            # Selecting any of the three dropdowns refreshes the role description.
+            Intention_config.select(fn=update_role_desc, inputs=[Intention_config, Knowledge_config, Responsibility_config], outputs=[role_desc])
+            Knowledge_config.select(fn=update_role_desc, inputs=[Intention_config, Knowledge_config, Responsibility_config], outputs=[role_desc])
+            Responsibility_config.select(fn=update_role_desc, inputs=[Intention_config, Knowledge_config, Responsibility_config], outputs=[role_desc])
+        with gr.Column():
+            backend_type = gr.Dropdown(
+                show_label=False,
+                choices=list(BACKEND_REGISTRY.keys()),
+                interactive=True,
+                visible=visible,
+                value=DEFAULT_BACKEND,
+            )
+            with gr.Accordion(
+                f"{name} Parameters", open=False, visible=visible
+            ) as accordion:
+                temperature = gr.Slider(
+                    minimum=0,
+                    maximum=2.0,
+                    step=0.1,
+                    interactive=True,
+                    visible=visible,
+                    label="temperature",
+                    value=0.7,
+                )
+                max_tokens = gr.Slider(
+                    minimum=10,
+                    maximum=500,
+                    step=10,
+                    interactive=True,
+                    visible=visible,
+                    label="max tokens",
+                    value=200,
+                )
+    return [role_name, Intention_config, Knowledge_config, Responsibility_config, backend_type, accordion, temperature, max_tokens]
+def get_area_chair_components(name, visible):
+    """Build the configuration widgets for the area chair (AC) tab.
+
+    The left column holds a hidden textbox carrying ``name``, the AC-type
+    dropdown and a role-description textbox that is regenerated whenever the
+    dropdown is selected.  The right column holds the backend selector and an
+    accordion with the temperature / max-token sliders.
+
+    Args:
+        name: Player name; stored in the hidden ``role_name`` textbox and used
+            in the accordion title.
+        visible: Visibility applied to the AC-type dropdown, the role
+            description, the backend selector, the accordion and both sliders.
+
+    Returns:
+        list: ``[role_name, AC_type, backend_type, accordion, temperature,
+        max_tokens]``.  The role-description textbox is not part of the list.
+    """
+    with gr.Row():
+        with gr.Column():
+            # Hidden field: only carries the player name to the event handlers.
+            role_name = gr.Textbox(
+                lines=1,
+                show_label=False,
+                interactive=True,
+                visible=False,
+                value=name,
+            )
+            AC_type = gr.Dropdown(
+                label = "AC Type",
+                show_label=True,
+                choices=["Inclusive", "Conformist", "Authoritarian", "Normal"],
+                interactive=True,
+                visible=visible,
+                value="Normal",
+            )
+            role_desc = gr.Textbox(
+                lines=8,
+                max_lines=8,
+                show_label=False,
+                interactive=True,
+                visible=visible,
+                value=get_ac_description("BASELINE", "ac_write_metareviews", 'None', 1),
+            )
+            def update_role_desc(AC_type):
+                """Regenerate the AC description for the selected AC type."""
+                # "Normal" maps to 'BASELINE'; every other choice is lower-cased.
+                ac_type = 'BASELINE' if AC_type == "Normal" else AC_type.lower()
+                return get_ac_description(ac_type, "ac_write_metareviews", "None", 1) # FIXME: should vary with the current phase
+            AC_type.select(fn=update_role_desc, inputs=[AC_type], outputs=[role_desc])
+        with gr.Column():
+            backend_type = gr.Dropdown(
+                show_label=False,
+                choices=list(BACKEND_REGISTRY.keys()),
+                interactive=True,
+                visible=visible,
+                value=DEFAULT_BACKEND,
+            )
+            with gr.Accordion(
+                f"{name} Parameters", open=False, visible=visible
+            ) as accordion:
+                temperature = gr.Slider(
+                    minimum=0,
+                    maximum=2.0,
+                    step=0.1,
+                    interactive=True,
+                    visible=visible,
+                    label="temperature",
+                    value=0.7,
+                )
+                max_tokens = gr.Slider(
+                    minimum=10,
+                    maximum=500,
+                    step=10,
+                    interactive=True,
+                    visible=visible,
+                    label="max tokens",
+                    value=200,
+                )
+    return [role_name, AC_type, backend_type, accordion, temperature, max_tokens]
+def get_empty_state():
+    return gr.State({"arena": None})
+with gr.Blocks(css=css) as demo:
+    state = get_empty_state()
+    all_components = []
+    with gr.Column(elem_id="col-container"):
+        gr.Markdown(
+            """# 🤖 AgentReview<br>
+Using Multi-Agent to review your paper!.
+**[Project Homepage](https://github.com/Ahren09/AgentReview)**""",
+            elem_id="header",
+        )
+        # Environment configuration
+        env_desc_textbox = gr.Textbox(
+            show_label=True,
+            lines=2,
+            visible=True,
+            label="Environment Description",
+            interactive=True,
+            # placeholder="Enter a description of a scenario or the game rules.",
+            value=const.GLOBAL_PROMPT,
+        )
+        all_components += [env_desc_textbox]
+        with gr.Row():
+            with gr.Column(elem_id="col-chatbox"):
+                with gr.Tab("All", visible=True):
+                    chatbot = gr.Chatbot(
+                        elem_id="chatbox", visible=True, show_label=False, height=600
+                    )
+                player_chatbots = []
+                for i in range(MAX_NUM_PLAYERS):
+                    player_name = f"Reviewer {i + 1}" if i < MAX_NUM_PLAYERS-1 else "AC"
+                    with gr.Tab(player_name, visible=(i < DEFAULT_NUM_PLAYERS)):
+                        player_chatbot = gr.Chatbot(
+                            elem_id=f"chatbox-{i}",
+                            visible=i < DEFAULT_NUM_PLAYERS,
+                            label=player_name,
+                            show_label=False,
+                            height=600,  # FIXME: 无效设置
+                        )
+                        player_chatbots.append(player_chatbot)
+            all_components += [chatbot, *player_chatbots]
+            with gr.Column(elem_id="col-config"):  # Player Configuration
+                # gr.Markdown("Player Configuration")
+                # parallel_checkbox = gr.Checkbox(
+                #     label="Parallel Actions", value=False, visible=True
+                # )
+                all_players_components, players_idx2comp = [], {}
+                with gr.Blocks():
+                    for i in range(MAX_NUM_PLAYERS):
+                        player_name = f"Reviewer {i + 1}" if i < MAX_NUM_PLAYERS-1 else "AC"
+                        with gr.Tab(
+                            player_name, visible=(i < DEFAULT_NUM_PLAYERS)
+                        ) as tab:
+                            if player_name != "AC":
+                                player_comps = get_player_components(
+                                    player_name, visible=(i < DEFAULT_NUM_PLAYERS)
+                                )
+                            else:
+                                player_comps = get_area_chair_components(
+                                    player_name, visible=(i < DEFAULT_NUM_PLAYERS)
+                                )
+                        players_idx2comp[i] = player_comps + [tab]
+                        all_players_components += player_comps + [tab]
+                all_components += all_players_components
+                # human_input_textbox = gr.Textbox(
+                #     show_label=True,
+                #     label="Human Input",
+                #     lines=1,
+                #     visible=True,
+                #     interactive=True,
+                #     placeholder="Upload your paper here",
+                # )
+                upload_file_box = gr.File(
+                    visible=True,
+                    height = 100,
+                )
+                with gr.Row():
+                    btn_step = gr.Button("Submit")
+                    btn_restart = gr.Button("Clear")
+                all_components += [upload_file_box, btn_step, btn_restart]
+    def _convert_to_chatbot_output(all_messages, display_recv=False):
+        chatbot_output = []
+        for i, message in enumerate(all_messages):
+            agent_name, msg, recv = (
+                message.agent_name,
+                message.content,
+                str(message.visible_to),
+            )
+            new_msg = re.sub(
+                r"\n+", "<br>", msg.strip()
+            )  # Preprocess message for chatbot output
+            if display_recv:
+                new_msg = f"**{agent_name} (-> {recv})**: {new_msg}"  # Add role to the message
+            else:
+                new_msg = f"**{agent_name}**: {new_msg}"
+            if agent_name == "Moderator":
+                chatbot_output.append((new_msg, None))
+            else:
+                chatbot_output.append((None, new_msg))
+        return chatbot_output
+    def _create_arena_config_from_components(all_comps: dict):
+        """Build a ``PaperReviewArena`` from the current values of the UI components.
+
+        Despite the name, the return value is the arena itself, not a config.
+
+        Args:
+            all_comps: Mapping from Gradio component to its current value, as
+                passed to the event handler.
+
+        Returns:
+            A ``PaperReviewArena`` whose players are, in order, the reviewers,
+            the AC, the paper extractor and the author.
+        """
+        env_desc = all_comps[env_desc_textbox]
+        paper_pdf_path = all_comps[upload_file_box]
+        # Step 1: Initialize the players
+        num_players = MAX_NUM_PLAYERS
+        # Placeholder values, supplied only to satisfy the pre-existing interface
+        conference = "EMNLP 2024"
+        paper_decision = "Accept"
+        data_dir = ''
+        paper_id = "12345"
+        args = Namespace(openai_client_type="openai",
+                         experiment_name="test",
+                         max_num_words=16384)
+        # Only the AC is enabled during the paper_decision phase
+        players = []
+        # role_desc cannot be read directly; a setting has to be generated from
+        # Intention_config, Knowledge_config and Responsibility_config instead
+        # self.environment.experiment_setting["players"]['Reviewer'][reviewer_index - 1]
+        experiment_setting = {
+        "paper_id": paper_id,
+        "paper_decision": paper_decision,
+        "players": {
+            # Paper Extractor is a special player that extracts a paper from the dataset.
+            # Its constructor does not take any arguments.
+            "Paper Extractor": [{}],
+            # Assume there is only one area chair (AC) in the experiment.
+            "AC": [],
+            # Author role with default configuration.
+            "Author": [{}],
+            # Reviewer settings are generated based on reviewer types provided in the settings.
+            "Reviewer": [],
+        },
+            # "global_settings": setting['global_settings']
+        }
+        for i in range(num_players):
+            if i < num_players-1: # reviewer
+                # Accordion and Tab entries hold no value, so they are filtered
+                # out before unpacking the seven reviewer settings.
+                role_name, intention_config, knowledge_config, responsibility_config, backend_type, temperature, max_tokens = (
+                    all_comps[c]
+                    for c in players_idx2comp[i]
+                    if not isinstance(c, (gr.Accordion, gr.Tab))
+                )
+                # Each dropdown maps to True / False / None (None for the middle choice).
+                is_benign = True if intention_config == "Benign" else (False if intention_config == "Malicious" else None)
+                is_knowledgeable = True if knowledge_config == "Knowledgeable" else (False if knowledge_config == "Unknownledgeable" else None)
+                is_responsible = True if responsibility_config == "Responsible" else (False if responsibility_config == "Lazy" else None)
+                experiment_setting["players"]['Reviewer'].append({"is_benign": is_benign,
+                                                                    "is_knowledgeable": is_knowledgeable,
+                                                                    "is_responsible": is_responsible,
+                                                                    "knows_authors": 'unfamous'})
+                role_desc = get_reviewer_description(is_benign, is_knowledgeable, is_responsible)
+            if i == num_players-1: # AC
+                role_name, ac_type, backend_type, temperature, max_tokens = (
+                    all_comps[c]
+                    for c in players_idx2comp[i]
+                    if not isinstance(c, (gr.Accordion, gr.Tab))
+                )
+                # "Normal" maps to 'BASELINE'; every other choice is lower-cased.
+                ac_type = 'BASELINE' if ac_type == "Normal" else ac_type.lower()
+                experiment_setting["players"]['AC'].append({"area_chair_type": ac_type})
+                role_desc = get_ac_description(ac_type, "ac_write_metareviews", "None", 1)
+            # common config for all players
+            player_config = {
+                "name": role_name,
+                "role_desc": role_desc,
+                "global_prompt": env_desc,
+                "backend": {
+                    "backend_type": backend_type,
+                    "temperature": temperature,
+                    "max_tokens": max_tokens,
+                },
+            }
+            # NOTE(review): the ``**player_config`` unpacking and item assignment
+            # below rely on AgentConfig behaving like a mapping -- confirm.
+            player_config = AgentConfig(**player_config)
+            if i < num_players-1:
+                player = Reviewer(data_dir=data_dir, conference=conference, args=args, **player_config)
+            else:
+                player_config["env_type"] = "paper_review"
+                player = AreaChair(data_dir=data_dir, conference=conference, args=args, **player_config)
+            players.append(player)
+        # Build this phase's players from the player_config above plus manually constructed ones
+        # if CURRENT_STEP == "paper_review":
+        # Manually add the paper extractor
+        paper_extractor_config = get_paper_extractor_config(max_tokens=2048)
+        paper_extractor = PaperExtractorPlayer( paper_pdf_path=paper_pdf_path,
+                                                data_dir=data_dir, paper_id=paper_id,
+                                                paper_decision=paper_decision, args=args,
+                                                conference=conference, **paper_extractor_config)
+        players.append(paper_extractor)
+        # Manually add the author
+        author_config = get_author_config()
+        author = Player(data_dir=data_dir, conference=conference, args=args,
+                        **author_config)
+        players.append(author)
+        player_names = [player.name for player in players]
+        # Step 2: Initialize the environment
+        env = PaperReview(player_names=player_names, paper_decision=paper_decision, paper_id=paper_id,
+                          args=args, experiment_setting=experiment_setting)
+        # Step 3: Initialize the Arena
+        arena = PaperReviewArena(players=players, environment=env, args=args, global_prompt=env_desc)
+        return arena
+    def step_game(all_comps: dict):
+        global CURRENT_STEP_INDEX
+        yield {
+            btn_step: gr.update(value="Running...", interactive=False),
+            btn_restart: gr.update(interactive=False),
+        }
+        cur_state = all_comps[state]
+        # If arena is not yet created, create it
+        if cur_state["arena"] is None:
+            # Create the Arena
+            arena = _create_arena_config_from_components(all_comps)
+            cur_state["arena"] = arena
+        else:
+            arena = cur_state["arena"]
+        # 当timestep.terminal 为真时才停止运行
+        # TODO: 连续运行
+        timestep = arena.step()
+        CURRENT_STEP_INDEX = int(arena.environment.phase_index)
+        # 更新前端信息
+        if timestep:
+            all_messages = timestep.observation
+            all_messages[0].content = 'Paper content has been extracted.'
+            chatbot_output = _convert_to_chatbot_output(all_messages, display_recv=True)
+            update_dict = {
+                chatbot: chatbot_output,
+                btn_step: gr.update(
+                    value="Next Step", interactive=not timestep.terminal
+                ),
+                btn_restart: gr.update(interactive=True),
+                state: cur_state,
+            }
+            # Reviewer 1, 2, 3 Area Chair, Paper Extractor, Author
+            for i, player in enumerate(arena.players):
+                if 'Reviewer' in player.name and arena.environment.phase_index < 4: # FIXME: 临时逻辑
+                    player_messages = arena.environment.get_observation(player.name)
+                    # 不要显示第一条长段的信息，只显示 文章内容已被抽取
+                    player_messages[0].content = 'Paper content has been extracted.'
+                    player_output = _convert_to_chatbot_output(player_messages)
+                    # Update the player's chatbot output
+                    update_dict[player_chatbots[i]] = player_output
+                elif arena.environment.phase_index in [4, 5]: # FIXME: 临时逻辑
+                    player_messages = arena.environment.get_observation('AC')
+                    player_messages[0].content = 'Paper content has been extracted.'
+                    player_output = _convert_to_chatbot_output(player_messages)
+                    # Update the player's chatbot output
+                    update_dict[player_chatbots[3]] = player_output
+            yield update_dict
+    def restart_game(all_comps: dict):
+        global CURRENT_STEP_INDEX
+        CURRENT_STEP_INDEX = 0
+        cur_state = all_comps[state]
+        cur_state["arena"] = None
+        yield {
+            chatbot: [],
+            btn_restart: gr.update(interactive=False),
+            btn_step: gr.update(interactive=False),
+            state: cur_state,
+        }
+        # arena_config = _create_arena_config_from_components(all_comps)
+        # arena = Arena.from_config(arena_config)
+        # log_arena(arena, database=DB)
+        # cur_state["arena"] = arena
+        yield {
+            btn_step: gr.update(value="Start", interactive=True),
+            btn_restart: gr.update(interactive=True),
+            upload_file_box: gr.update(value=None),
+            state: cur_state,
+        }
+    # Remove Accordion and Tab from the list of components
+    all_components = [
+        comp for comp in all_components if not isinstance(comp, (gr.Accordion, gr.Tab))
+    ]
+    # update component
+    # env_desc_textbox.change()
+    # If any of the Textbox, Slider, Checkbox, Dropdown, RadioButtons is changed, the Step button is disabled
+    for comp in all_components:
+        def _disable_step_button(state):
+            if state["arena"] is not None:
+                return gr.update(interactive=False)
+            else:
+                return gr.update()
+        if (
+            isinstance(
+                comp, (gr.Textbox, gr.Slider, gr.Checkbox, gr.Dropdown, gr.Radio)
+            )
+            and comp is not upload_file_box
+        ):
+            comp.change(_disable_step_button, state, btn_step)
+    # print(set(all_components + [state]))
+    btn_step.click(
+        step_game,
+        set(all_components + [state]),
+        [chatbot, *player_chatbots, btn_step, btn_restart, state, upload_file_box],
+    )
+    btn_restart.click(
+        restart_game,
+        set(all_components + [state]),
+        [chatbot, *player_chatbots, btn_step, btn_restart, state, upload_file_box],
+    )
+demo.queue()
+demo.launch(debug=DEBUG, server_port=8082)

template.py ADDED Viewed

	@@ -0,0 +1,576 @@

+import json
+import re
+from glob import glob
+import gradio as gr
+from chatarena.arena import Arena, TooManyInvalidActions
+from chatarena.backends import BACKEND_REGISTRY
+from chatarena.backends.human import HumanBackendError
+from chatarena.config import ArenaConfig
+from chatarena.database import SupabaseDB, log_arena, log_messages, supabase_available
+from chatarena.environments import ENV_REGISTRY
+from chatarena.message import Message
+# Custom CSS handed to gr.Blocks(css=...). The "#..." selectors correspond to elem_id
+# values assigned to components below (e.g. "col-container", "header", "col-chatbox").
+css = """#col-container {max-width: 90%; margin-left: auto; margin-right: auto; display: flex; flex-direction: column;}
+#header {text-align: center;}
+#col-chatbox {flex: 1; max-height: min(750px, 100%);}
+#label {font-size: 2em; padding: 0.5em; margin: 0;}
+.message {font-size: 1.2em;}
+.message-wrap {max-height: min(700px, 100vh);}
+"""
+# Earlier CSS rules kept for reference; they are comments and are not applied.
+# .wrap {min-width: min(640px, 100vh)}
+# #env-desc {max-height: 100px; overflow-y: auto;}
+# .textarea {height: 100px; max-height: 100px;}
+# #chatbot-tab-all {height: 750px; max-height: min(750px, 100%);}
+# #chatbox {height: min(750px, 100%); max-height: min(750px, 100%);}
+# #chatbox.block {height: 730px}
+# .wrap {max-height: 680px;}
+# .scroll-hide {overflow-y: scroll; max-height: 100px;}
+# Passed to demo.launch(debug=...) and gates the environment print in step_game.
+DEBUG = False
+# Initial value of every backend dropdown.
+DEFAULT_BACKEND = "openai-chat"
+# Initial value of the environment-type dropdown.
+DEFAULT_ENV = "conversation"
+# Number of player slots built up front; also the upper bound of the player slider.
+MAX_NUM_PLAYERS = 6
+# Number of player slots visible at startup and the slider's initial value.
+DEFAULT_NUM_PLAYERS = 2
+def load_examples():
+    example_configs = {}
+    # Load json config files from examples folder
+    example_files = glob("examples/*.json")
+    for example_file in example_files:
+        with open(example_file, encoding="utf-8") as f:
+            example = json.load(f)
+            try:
+                example_configs[example["name"]] = example
+            except KeyError:
+                print(f"Example {example_file} is missing a name field. Skipping.")
+    return example_configs
+# Example configs keyed by name, loaded once at import time; feeds the example dropdown.
+EXAMPLE_REGISTRY = load_examples()
+# Database handle passed to log_arena/log_messages; None when supabase is unavailable.
+DB = SupabaseDB() if supabase_available else None
+def get_moderator_components(visible=True):
+    name = "Moderator"
+    with gr.Row():
+        with gr.Column():
+            role_desc = gr.Textbox(
+                label="Moderator role",
+                lines=1,
+                visible=visible,
+                interactive=True,
+                placeholder=f"Enter the role description for {name}",
+            )
+            terminal_condition = gr.Textbox(
+                show_label=False,
+                lines=1,
+                visible=visible,
+                interactive=True,
+                placeholder="Enter the termination criteria",
+            )
+        with gr.Column():
+            backend_type = gr.Dropdown(
+                show_label=False,
+                visible=visible,
+                interactive=True,
+                choices=list(BACKEND_REGISTRY.keys()),
+                value=DEFAULT_BACKEND,
+            )
+            with gr.Accordion(
+                f"{name} Parameters", open=False, visible=visible
+            ) as accordion:
+                temperature = gr.Slider(
+                    minimum=0,
+                    maximum=2.0,
+                    step=0.1,
+                    interactive=True,
+                    visible=visible,
+                    label="temperature",
+                    value=0.7,
+                )
+                max_tokens = gr.Slider(
+                    minimum=10,
+                    maximum=500,
+                    step=10,
+                    interactive=True,
+                    visible=visible,
+                    label="max tokens",
+                    value=200,
+                )
+    return [
+        role_desc,
+        terminal_condition,
+        backend_type,
+        accordion,
+        temperature,
+        max_tokens,
+    ]
+def get_player_components(name, visible):
+    with gr.Row():
+        with gr.Column():
+            role_name = gr.Textbox(
+                line=1,
+                show_label=False,
+                interactive=True,
+                visible=visible,
+                placeholder=f"Player name for {name}",
+            )
+            role_desc = gr.Textbox(
+                lines=3,
+                show_label=False,
+                interactive=True,
+                visible=visible,
+                placeholder=f"Enter the role description for {name}",
+            )
+        with gr.Column():
+            backend_type = gr.Dropdown(
+                show_label=False,
+                choices=list(BACKEND_REGISTRY.keys()),
+                interactive=True,
+                visible=visible,
+                value=DEFAULT_BACKEND,
+            )
+            with gr.Accordion(
+                f"{name} Parameters", open=False, visible=visible
+            ) as accordion:
+                temperature = gr.Slider(
+                    minimum=0,
+                    maximum=2.0,
+                    step=0.1,
+                    interactive=True,
+                    visible=visible,
+                    label="temperature",
+                    value=0.7,
+                )
+                max_tokens = gr.Slider(
+                    minimum=10,
+                    maximum=500,
+                    step=10,
+                    interactive=True,
+                    visible=visible,
+                    label="max tokens",
+                    value=200,
+                )
+    return [role_name, role_desc, backend_type, accordion, temperature, max_tokens]
+def get_empty_state():
+    return gr.State({"arena": None})
+# Build the UI. Components are appended to all_components as they are created so the
+# event handlers registered further down can take them as inputs.
+with gr.Blocks(css=css) as demo:
+    # State object holding a dict whose "arena" entry is None until an arena is created.
+    state = get_empty_state()
+    all_components = []
+    with gr.Column(elem_id="col-container"):
+        gr.Markdown(
+            """# 🏟 ChatArena️<br>
+Prompting multiple AI agents to play games in a language-driven environment.
+**[Project Homepage](https://github.com/chatarena/chatarena)**""",
+            elem_id="header",
+        )
+        # Top row: environment type and example picker.
+        with gr.Row():
+            env_selector = gr.Dropdown(
+                choices=list(ENV_REGISTRY.keys()),
+                value=DEFAULT_ENV,
+                interactive=True,
+                label="Environment Type",
+                show_label=True,
+            )
+            example_selector = gr.Dropdown(
+                choices=list(EXAMPLE_REGISTRY.keys()),
+                interactive=True,
+                label="Select Example",
+                show_label=True,
+            )
+        # Environment configuration
+        env_desc_textbox = gr.Textbox(
+            show_label=True,
+            lines=2,
+            visible=True,
+            label="Environment Description",
+            placeholder="Enter a description of a scenario or the game rules.",
+        )
+        all_components += [env_selector, example_selector, env_desc_textbox]
+        with gr.Row():
+            # Left column: one "All" chat tab plus one chat tab per player slot.
+            with gr.Column(elem_id="col-chatbox"):
+                with gr.Tab("All", visible=True):
+                    chatbot = gr.Chatbot(
+                        elem_id="chatbox", visible=True, show_label=False
+                    )
+                player_chatbots = []
+                # All MAX_NUM_PLAYERS tabs are created; only the first
+                # DEFAULT_NUM_PLAYERS start visible.
+                for i in range(MAX_NUM_PLAYERS):
+                    player_name = f"Player {i + 1}"
+                    with gr.Tab(player_name, visible=(i < DEFAULT_NUM_PLAYERS)):
+                        player_chatbot = gr.Chatbot(
+                            elem_id=f"chatbox-{i}",
+                            visible=i < DEFAULT_NUM_PLAYERS,
+                            label=player_name,
+                            show_label=False,
+                        )
+                        player_chatbots.append(player_chatbot)
+            all_components += [chatbot, *player_chatbots]
+            with gr.Column(elem_id="col-config"):  # Player Configuration
+                # gr.Markdown("Player Configuration")
+                parallel_checkbox = gr.Checkbox(
+                    label="Parallel Actions", value=False, visible=True
+                )
+                with gr.Accordion("Moderator", open=False, visible=True):
+                    moderator_components = get_moderator_components(True)
+                all_components += [parallel_checkbox, *moderator_components]
+                # all_players_components: flat list of every player widget and tab.
+                # players_idx2comp: slot index -> that slot's widgets followed by its tab.
+                all_players_components, players_idx2comp = [], {}
+                with gr.Blocks():
+                    num_player_slider = gr.Slider(
+                        2,
+                        MAX_NUM_PLAYERS,
+                        value=DEFAULT_NUM_PLAYERS,
+                        step=1,
+                        label="Number of players:",
+                    )
+                    for i in range(MAX_NUM_PLAYERS):
+                        player_name = f"Player {i + 1}"
+                        with gr.Tab(
+                            player_name, visible=(i < DEFAULT_NUM_PLAYERS)
+                        ) as tab:
+                            player_comps = get_player_components(
+                                player_name, visible=(i < DEFAULT_NUM_PLAYERS)
+                            )
+                        players_idx2comp[i] = player_comps + [tab]
+                        all_players_components += player_comps + [tab]
+                all_components += [num_player_slider] + all_players_components
+                def variable_players(k):
+                    k = int(k)
+                    update_dict = {}
+                    for i in range(MAX_NUM_PLAYERS):
+                        if i < k:
+                            for comp in players_idx2comp[i]:
+                                update_dict[comp] = gr.update(visible=True)
+                            update_dict[player_chatbots[i]] = gr.update(visible=True)
+                        else:
+                            for comp in players_idx2comp[i]:
+                                update_dict[comp] = gr.update(visible=False)
+                            update_dict[player_chatbots[i]] = gr.update(visible=False)
+                    return update_dict
+                num_player_slider.change(
+                    variable_players,
+                    num_player_slider,
+                    all_players_components + player_chatbots,
+                )
+                # Free-text input; step_game reads it when arena.step() raises
+                # HumanBackendError.
+                human_input_textbox = gr.Textbox(
+                    show_label=True,
+                    label="Human Input",
+                    lines=1,
+                    visible=True,
+                    interactive=True,
+                    placeholder="Enter your input here",
+                )
+                with gr.Row():
+                    # btn_step is wired to step_game and btn_restart to restart_game below.
+                    btn_step = gr.Button("Start")
+                    btn_restart = gr.Button("Clear")
+                all_components += [human_input_textbox, btn_step, btn_restart]
+    def _convert_to_chatbot_output(all_messages, display_recv=False):
+        chatbot_output = []
+        for i, message in enumerate(all_messages):
+            agent_name, msg, recv = (
+                message.agent_name,
+                message.content,
+                str(message.visible_to),
+            )
+            new_msg = re.sub(
+                r"\n+", "<br>", msg.strip()
+            )  # Preprocess message for chatbot output
+            if display_recv:
+                new_msg = f"**{agent_name} (-> {recv})**: {new_msg}"  # Add role to the message
+            else:
+                new_msg = f"**{agent_name}**: {new_msg}"
+            if agent_name == "Moderator":
+                chatbot_output.append((new_msg, None))
+            else:
+                chatbot_output.append((None, new_msg))
+        return chatbot_output
+    def _create_arena_config_from_components(all_comps: dict) -> ArenaConfig:
+        env_desc = all_comps[env_desc_textbox]
+        # Initialize the players
+        num_players = all_comps[num_player_slider]
+        player_configs = []
+        for i in range(num_players):
+            role_name, role_desc, backend_type, temperature, max_tokens = (
+                all_comps[c]
+                for c in players_idx2comp[i]
+                if not isinstance(c, (gr.Accordion, gr.Tab))
+            )
+            player_config = {
+                "name": role_name,
+                "role_desc": role_desc,
+                "global_prompt": env_desc,
+                "backend": {
+                    "backend_type": backend_type,
+                    "temperature": temperature,
+                    "max_tokens": max_tokens,
+                },
+            }
+            player_configs.append(player_config)
+        # Initialize the environment
+        env_type = all_comps[env_selector]
+        # Get moderator config
+        (
+            mod_role_desc,
+            mod_terminal_condition,
+            moderator_backend_type,
+            mod_temp,
+            mod_max_tokens,
+        ) = (
+            all_comps[c]
+            for c in moderator_components
+            if not isinstance(c, (gr.Accordion, gr.Tab))
+        )
+        moderator_config = {
+            "role_desc": mod_role_desc,
+            "global_prompt": env_desc,
+            "terminal_condition": mod_terminal_condition,
+            "backend": {
+                "backend_type": moderator_backend_type,
+                "temperature": mod_temp,
+                "max_tokens": mod_max_tokens,
+            },
+        }
+        env_config = {
+            "env_type": env_type,
+            "parallel": all_comps[parallel_checkbox],
+            "moderator": moderator_config,
+            "moderator_visibility": "all",
+            "moderator_period": None,
+        }
+        # arena_config = {"players": player_configs, "environment": env_config}
+        arena_config = ArenaConfig(players=player_configs, environment=env_config)
+        return arena_config
+    def step_game(all_comps: dict):
+        yield {
+            btn_step: gr.update(value="Running...", interactive=False),
+            btn_restart: gr.update(interactive=False),
+        }
+        cur_state = all_comps[state]
+        # If arena is not yet created, create it
+        if cur_state["arena"] is None:
+            # Create the Arena
+            arena_config = _create_arena_config_from_components(all_comps)
+            arena = Arena.from_config(arena_config)
+            log_arena(arena, database=DB)
+            cur_state["arena"] = arena
+        else:
+            arena = cur_state["arena"]
+        try:
+            timestep = arena.step()
+        except HumanBackendError as e:
+            # Handle human input and recover with the game update
+            human_input = all_comps[human_input_textbox]
+            if human_input == "":
+                timestep = None  # Failed to get human input
+            else:
+                timestep = arena.environment.step(e.agent_name, human_input)
+        except TooManyInvalidActions:
+            timestep = arena.current_timestep
+            timestep.observation.append(
+                Message(
+                    "System",
+                    "Too many invalid actions. Game over.",
+                    turn=-1,
+                    visible_to="all",
+                )
+            )
+            timestep.terminal = True
+        if timestep is None:
+            yield {
+                human_input_textbox: gr.update(
+                    value="", placeholder="Please enter a valid input"
+                ),
+                btn_step: gr.update(value="Next Step", interactive=True),
+                btn_restart: gr.update(interactive=True),
+            }
+        else:
+            all_messages = timestep.observation  # user sees what the moderator sees
+            log_messages(arena, all_messages, database=DB)
+            chatbot_output = _convert_to_chatbot_output(all_messages, display_recv=True)
+            update_dict = {
+                human_input_textbox: gr.Textbox.update(value=""),
+                chatbot: chatbot_output,
+                btn_step: gr.update(
+                    value="Next Step", interactive=not timestep.terminal
+                ),
+                btn_restart: gr.update(interactive=True),
+                state: cur_state,
+            }
+            # Get the visible messages for each player
+            for i, player in enumerate(arena.players):
+                player_messages = arena.environment.get_observation(player.name)
+                player_output = _convert_to_chatbot_output(player_messages)
+                # Update the player's chatbot output
+                update_dict[player_chatbots[i]] = player_output
+            if DEBUG:
+                arena.environment.print()
+            yield update_dict
+    def restart_game(all_comps: dict):
+        cur_state = all_comps[state]
+        cur_state["arena"] = None
+        yield {
+            chatbot: [],
+            btn_restart: gr.update(interactive=False),
+            btn_step: gr.update(interactive=False),
+            state: cur_state,
+        }
+        arena_config = _create_arena_config_from_components(all_comps)
+        arena = Arena.from_config(arena_config)
+        log_arena(arena, database=DB)
+        cur_state["arena"] = arena
+        yield {
+            btn_step: gr.update(value="Start", interactive=True),
+            btn_restart: gr.update(interactive=True),
+            state: cur_state,
+        }
+    # Remove Accordion and Tab from the list of components
+    all_components = [
+        comp for comp in all_components if not isinstance(comp, (gr.Accordion, gr.Tab))
+    ]
+    # If any of the Textbox, Slider, Checkbox, Dropdown, RadioButtons is changed, the Step button is disabled
+    for comp in all_components:
+        def _disable_step_button(state):
+            if state["arena"] is not None:
+                return gr.update(interactive=False)
+            else:
+                return gr.update()
+        if (
+            isinstance(
+                comp, (gr.Textbox, gr.Slider, gr.Checkbox, gr.Dropdown, gr.Radio)
+            )
+            and comp is not human_input_textbox
+        ):
+            comp.change(_disable_step_button, state, btn_step)
+    btn_step.click(
+        step_game,
+        set(all_components + [state]),
+        [chatbot, *player_chatbots, btn_step, btn_restart, state, human_input_textbox],
+    )
+    btn_restart.click(
+        restart_game,
+        set(all_components + [state]),
+        [chatbot, *player_chatbots, btn_step, btn_restart, state, human_input_textbox],
+    )
+    # If an example is selected, update the components
+    def update_components_from_example(all_comps: dict):
+        example_name = all_comps[example_selector]
+        example_config = EXAMPLE_REGISTRY[example_name]
+        update_dict = {}
+        # Update the environment components
+        env_config = example_config["environment"]
+        update_dict[env_desc_textbox] = gr.update(value=example_config["global_prompt"])
+        update_dict[env_selector] = gr.update(value=env_config["env_type"])
+        update_dict[parallel_checkbox] = gr.update(value=env_config["parallel"])
+        # Update the moderator components
+        if "moderator" in env_config:
+            (
+                mod_role_desc,
+                mod_terminal_condition,
+                moderator_backend_type,
+                mod_temp,
+                mod_max_tokens,
+            ) = (
+                c
+                for c in moderator_components
+                if not isinstance(c, (gr.Accordion, gr.Tab))
+            )
+            update_dict[mod_role_desc] = gr.update(
+                value=env_config["moderator"]["role_desc"]
+            )
+            update_dict[mod_terminal_condition] = gr.update(
+                value=env_config["moderator"]["terminal_condition"]
+            )
+            update_dict[moderator_backend_type] = gr.update(
+                value=env_config["moderator"]["backend"]["backend_type"]
+            )
+            update_dict[mod_temp] = gr.update(
+                value=env_config["moderator"]["backend"]["temperature"]
+            )
+            update_dict[mod_max_tokens] = gr.update(
+                value=env_config["moderator"]["backend"]["max_tokens"]
+            )
+        # Update the player components
+        update_dict[num_player_slider] = gr.update(value=len(example_config["players"]))
+        for i, player_config in enumerate(example_config["players"]):
+            role_name, role_desc, backend_type, temperature, max_tokens = (
+                c
+                for c in players_idx2comp[i]
+                if not isinstance(c, (gr.Accordion, gr.Tab))
+            )
+            update_dict[role_name] = gr.update(value=player_config["name"])
+            update_dict[role_desc] = gr.update(value=player_config["role_desc"])
+            update_dict[backend_type] = gr.update(
+                value=player_config["backend"]["backend_type"]
+            )
+            update_dict[temperature] = gr.update(
+                value=player_config["backend"]["temperature"]
+            )
+            update_dict[max_tokens] = gr.update(
+                value=player_config["backend"]["max_tokens"]
+            )
+        return update_dict
+    example_selector.change(
+        update_components_from_example,
+        set(all_components + [state]),
+        all_components + [state],
+    )
+demo.queue()
+demo.launch(debug=DEBUG, server_port=8080)