import json
import re
from glob import glob
from argparse import Namespace
import gradio as gr
from agentreview import const
from agentreview.config import AgentConfig
from agentreview.agent import Player
from agentreview.backends import BACKEND_REGISTRY
from agentreview.environments import PaperReview
from agentreview.paper_review_arena import PaperReviewArena
from agentreview.utility.experiment_utils import initialize_players
from agentreview.paper_review_player import PaperExtractorPlayer, AreaChair, Reviewer
from agentreview.role_descriptions import get_reviewer_description, get_ac_description, get_author_config, get_paper_extractor_config
# 该文件的使命是前端交互:构建前端页面,从页面中获取用户的配置,传入后端运行,将结果实时展示到相应模块
css = """#col-container {max-width: 90%; margin-left: auto; margin-right: auto; display: flex; flex-direction: column;}
#header {text-align: center;}
#col-chatbox {flex: 1; max-height: min(900px, 100%);}
#label {font-size: 2em; padding: 0.5em; margin: 0;}
.message {font-size: 1.2em;}
.message-wrap {max-height: min(700px, 100vh);}
"""
# .wrap {min-width: min(640px, 100vh)}
# #env-desc {max-height: 100px; overflow-y: auto;}
# .textarea {height: 100px; max-height: 100px;}
# #chatbot-tab-all {height: 750px; max-height: min(750px, 100%);}
# #chatbox {height: min(750px, 100%); max-height: min(750px, 100%);}
# #chatbox.block {height: 730px}
# .wrap {max-height: 680px;}
# .scroll-hide {overflow-y: scroll; max-height: 100px;}
DEBUG = False
DEFAULT_BACKEND = "openai-chat"
MAX_NUM_PLAYERS = 4
DEFAULT_NUM_PLAYERS = 4
CURRENT_STEP_INDEX = 0
def load_examples():
example_configs = {}
# Load json config files from examples folder
example_files = glob("examples/*.json")
for example_file in example_files:
with open(example_file, encoding="utf-8") as f:
example = json.load(f)
try:
example_configs[example["name"]] = example
except KeyError:
print(f"Example {example_file} is missing a name field. Skipping.")
return example_configs
EXAMPLE_REGISTRY = load_examples()
# DB = SupabaseDB() if supabase_available else None
def get_player_components(name, visible):
with gr.Row():
with gr.Column():
role_name = gr.Textbox(
lines=1,
show_label=False,
interactive=True,
visible=False,
value=name,
)
# is benign, is_knowledgeable, is_responsible,
# player_config = gr.CheckboxGroup(
# choices=["Benign", "Knowledgeable", "Responsible"],
# label="Reviewer Type",
# visible=visible,
# )
with gr.Row():
# 将三个属性做成dropdown
Intention_config = gr.Dropdown(
choices=["Benign", "Malicious", "Neutral"],
interactive=True,
label = "Intention",
show_label=True,
value="Neutral",
)
Knowledge_config = gr.Dropdown(
choices=["Knowledgeable", "Unknownledgeable", "Normal"],
interactive=True,
label = "Knowledgeability",
show_label=True,
value="Normal",
)
Responsibility_config = gr.Dropdown(
choices=["Responsible", "Lazy", "Normal"],
interactive=True,
label = "Responsibility",
show_label=True,
value="Normal",
)
role_desc = gr.Textbox(
lines=8,
max_lines=8,
show_label=False,
interactive=True,
visible=visible,
autoscroll=False,
value=get_reviewer_description()
)
# role_desc = gr.Markdown(value=get_reviewer_description(),
# visible=visible)
def update_role_desc(Intention_config, Knowledge_config, Responsibility_config):
is_benign = True if Intention_config == "Benign" else (False if Intention_config == "Malicious" else None)
is_knowledgeable = True if Knowledge_config == "Knowledgeable" else (False if Knowledge_config == "Unknownledgeable" else None)
is_responsible = True if Responsibility_config == "Responsible" else (False if Responsibility_config == "Lazy" else None)
phase = 'reviewer_write_reviews' if CURRENT_STEP_INDEX < 2 else 'reviewer_ac_discussion'
return get_reviewer_description(is_benign, is_knowledgeable, is_responsible, phase=phase) # FIXME:依据阶段变化
Intention_config.select(fn=update_role_desc, inputs=[Intention_config, Knowledge_config, Responsibility_config], outputs=[role_desc])
Knowledge_config.select(fn=update_role_desc, inputs=[Intention_config, Knowledge_config, Responsibility_config], outputs=[role_desc])
Responsibility_config.select(fn=update_role_desc, inputs=[Intention_config, Knowledge_config, Responsibility_config], outputs=[role_desc])
with gr.Column():
backend_type = gr.Dropdown(
show_label=False,
choices=list(BACKEND_REGISTRY.keys()),
interactive=True,
visible=visible,
value=DEFAULT_BACKEND,
)
with gr.Accordion(
f"{name} Parameters", open=False, visible=visible
) as accordion:
temperature = gr.Slider(
minimum=0,
maximum=2.0,
step=0.1,
interactive=True,
visible=visible,
label="temperature",
value=0.7,
)
max_tokens = gr.Slider(
minimum=10,
maximum=500,
step=10,
interactive=True,
visible=visible,
label="max tokens",
value=200,
)
return [role_name, Intention_config, Knowledge_config, Responsibility_config, backend_type, accordion, temperature, max_tokens]
def get_area_chair_components(name, visible):
with gr.Row():
with gr.Column():
role_name = gr.Textbox(
lines=1,
show_label=False,
interactive=True,
visible=False,
value=name,
)
AC_type = gr.Dropdown(
label = "AC Type",
show_label=True,
choices=["Inclusive", "Conformist", "Authoritarian", "Normal"],
interactive=True,
visible=visible,
value="Normal",
)
role_desc = gr.Textbox(
lines=8,
max_lines=8,
show_label=False,
interactive=True,
visible=visible,
value=get_ac_description("BASELINE", "ac_write_metareviews", 'None', 1),
)
def update_role_desc(AC_type):
ac_type = 'BASELINE' if AC_type == "Normal" else AC_type.lower()
return get_ac_description(ac_type, "ac_write_metareviews", "None", 1) # FIXME:依据阶段变化
AC_type.select(fn=update_role_desc, inputs=[AC_type], outputs=[role_desc])
with gr.Column():
backend_type = gr.Dropdown(
show_label=False,
choices=list(BACKEND_REGISTRY.keys()),
interactive=True,
visible=visible,
value=DEFAULT_BACKEND,
)
with gr.Accordion(
f"{name} Parameters", open=False, visible=visible
) as accordion:
temperature = gr.Slider(
minimum=0,
maximum=2.0,
step=0.1,
interactive=True,
visible=visible,
label="temperature",
value=0.7,
)
max_tokens = gr.Slider(
minimum=10,
maximum=500,
step=10,
interactive=True,
visible=visible,
label="max tokens",
value=200,
)
return [role_name, AC_type, backend_type, accordion, temperature, max_tokens]
def get_empty_state():
return gr.State({"arena": None})
with gr.Blocks(css=css) as demo:
state = get_empty_state()
all_components = []
with gr.Column(elem_id="col-container"):
gr.Markdown(
"""# 🤖 AgentReview
Using Multi-Agent to review your paper!.
**[Project Homepage](https://github.com/Ahren09/AgentReview)**""",
elem_id="header",
)
# Environment configuration
env_desc_textbox = gr.Textbox(
show_label=True,
lines=2,
visible=True,
label="Environment Description",
interactive=True,
# placeholder="Enter a description of a scenario or the game rules.",
value=const.GLOBAL_PROMPT,
)
all_components += [env_desc_textbox]
with gr.Row():
with gr.Column(elem_id="col-chatbox"):
with gr.Tab("All", visible=True):
chatbot = gr.Chatbot(
elem_id="chatbox", visible=True, show_label=False, height=600
)
player_chatbots = []
for i in range(MAX_NUM_PLAYERS):
player_name = f"Reviewer {i + 1}" if i < MAX_NUM_PLAYERS-1 else "AC"
with gr.Tab(player_name, visible=(i < DEFAULT_NUM_PLAYERS)):
player_chatbot = gr.Chatbot(
elem_id=f"chatbox-{i}",
visible=i < DEFAULT_NUM_PLAYERS,
label=player_name,
show_label=False,
height=600, # FIXME: 无效设置
)
player_chatbots.append(player_chatbot)
all_components += [chatbot, *player_chatbots]
with gr.Column(elem_id="col-config"): # Player Configuration
# gr.Markdown("Player Configuration")
# parallel_checkbox = gr.Checkbox(
# label="Parallel Actions", value=False, visible=True
# )
all_players_components, players_idx2comp = [], {}
with gr.Blocks():
for i in range(MAX_NUM_PLAYERS):
player_name = f"Reviewer {i + 1}" if i < MAX_NUM_PLAYERS-1 else "AC"
with gr.Tab(
player_name, visible=(i < DEFAULT_NUM_PLAYERS)
) as tab:
if player_name != "AC":
player_comps = get_player_components(
player_name, visible=(i < DEFAULT_NUM_PLAYERS)
)
else:
player_comps = get_area_chair_components(
player_name, visible=(i < DEFAULT_NUM_PLAYERS)
)
players_idx2comp[i] = player_comps + [tab]
all_players_components += player_comps + [tab]
all_components += all_players_components
# human_input_textbox = gr.Textbox(
# show_label=True,
# label="Human Input",
# lines=1,
# visible=True,
# interactive=True,
# placeholder="Upload your paper here",
# )
upload_file_box = gr.File(
visible=True,
height = 100,
)
with gr.Row():
btn_step = gr.Button("Submit")
btn_restart = gr.Button("Clear")
all_components += [upload_file_box, btn_step, btn_restart]
def _convert_to_chatbot_output(all_messages, display_recv=False):
chatbot_output = []
for i, message in enumerate(all_messages):
agent_name, msg, recv = (
message.agent_name,
message.content,
str(message.visible_to),
)
new_msg = re.sub(
r"\n+", "
", msg.strip()
) # Preprocess message for chatbot output
if display_recv:
new_msg = f"**{agent_name} (-> {recv})**: {new_msg}" # Add role to the message
else:
new_msg = f"**{agent_name}**: {new_msg}"
if agent_name == "Moderator":
chatbot_output.append((new_msg, None))
else:
chatbot_output.append((None, new_msg))
return chatbot_output
def _create_arena_config_from_components(all_comps: dict):
env_desc = all_comps[env_desc_textbox]
paper_pdf_path = all_comps[upload_file_box]
# Step 1: Initialize the players
num_players = MAX_NUM_PLAYERS
# 为了适应之前的接口填充无意义数据
conference = "EMNLP 2024"
paper_decision = "Accept"
data_dir = ''
paper_id = "12345"
args = Namespace(openai_client_type="openai",
experiment_name="test",
max_num_words=16384)
# 在paper_decision 阶段 中只启用 AC
players = []
# 不能直接获取role_desc,需要根据Intention_config, Knowledge_config, Responsibility_config生成一个配置
# self.environment.experiment_setting["players"]['Reviewer'][reviewer_index - 1]
experiment_setting = {
"paper_id": paper_id,
"paper_decision": paper_decision,
"players": {
# Paper Extractor is a special player that extracts a paper from the dataset.
# Its constructor does not take any arguments.
"Paper Extractor": [{}],
# Assume there is only one area chair (AC) in the experiment.
"AC": [],
# Author role with default configuration.
"Author": [{}],
# Reviewer settings are generated based on reviewer types provided in the settings.
"Reviewer": [],
},
# "global_settings": setting['global_settings']
}
for i in range(num_players):
if i < num_players-1: # reviewer
role_name, intention_config, knowledge_config, responsibility_config, backend_type, temperature, max_tokens = (
all_comps[c]
for c in players_idx2comp[i]
if not isinstance(c, (gr.Accordion, gr.Tab))
)
is_benign = True if intention_config == "Benign" else (False if intention_config == "Malicious" else None)
is_knowledgeable = True if knowledge_config == "Knowledgeable" else (False if knowledge_config == "Unknownledgeable" else None)
is_responsible = True if responsibility_config == "Responsible" else (False if responsibility_config == "Lazy" else None)
experiment_setting["players"]['Reviewer'].append({"is_benign": is_benign,
"is_knowledgeable": is_knowledgeable,
"is_responsible": is_responsible,
"knows_authors": 'unfamous'})
role_desc = get_reviewer_description(is_benign, is_knowledgeable, is_responsible)
if i == num_players-1: # AC
role_name, ac_type, backend_type, temperature, max_tokens = (
all_comps[c]
for c in players_idx2comp[i]
if not isinstance(c, (gr.Accordion, gr.Tab))
)
ac_type = 'BASELINE' if ac_type == "Normal" else ac_type.lower()
experiment_setting["players"]['AC'].append({"area_chair_type": ac_type})
role_desc = get_ac_description(ac_type, "ac_write_metareviews", "None", 1)
# common config for all players
player_config = {
"name": role_name,
"role_desc": role_desc,
"global_prompt": env_desc,
"backend": {
"backend_type": backend_type,
"temperature": temperature,
"max_tokens": max_tokens,
},
}
player_config = AgentConfig(**player_config)
if i < num_players-1:
player = Reviewer(data_dir=data_dir, conference=conference, args=args, **player_config)
else:
player_config["env_type"] = "paper_review"
player = AreaChair(data_dir=data_dir, conference=conference, args=args, **player_config)
players.append(player)
# 根据上面的player_config和人造生成该阶段的players
# if CURRENT_STEP == "paper_review":
# 人为加入paper extractor
paper_extractor_config = get_paper_extractor_config(max_tokens=2048)
paper_extractor = PaperExtractorPlayer( paper_pdf_path=paper_pdf_path,
data_dir=data_dir, paper_id=paper_id,
paper_decision=paper_decision, args=args,
conference=conference, **paper_extractor_config)
players.append(paper_extractor)
# 人为加入author
author_config = get_author_config()
author = Player(data_dir=data_dir, conference=conference, args=args,
**author_config)
players.append(author)
player_names = [player.name for player in players]
# Step 2: Initialize the environment
env = PaperReview(player_names=player_names, paper_decision=paper_decision, paper_id=paper_id,
args=args, experiment_setting=experiment_setting)
# Step 3: Initialize the Arena
arena = PaperReviewArena(players=players, environment=env, args=args, global_prompt=env_desc)
return arena
def step_game(all_comps: dict):
global CURRENT_STEP_INDEX
yield {
btn_step: gr.update(value="Running...", interactive=False),
btn_restart: gr.update(interactive=False),
}
cur_state = all_comps[state]
# If arena is not yet created, create it
if cur_state["arena"] is None:
# Create the Arena
arena = _create_arena_config_from_components(all_comps)
cur_state["arena"] = arena
else:
arena = cur_state["arena"]
# 当timestep.terminal 为真时才停止运行
# TODO: 连续运行
timestep = arena.step()
CURRENT_STEP_INDEX = int(arena.environment.phase_index)
# 更新前端信息
if timestep:
all_messages = timestep.observation
all_messages[0].content = 'Paper content has been extracted.'
chatbot_output = _convert_to_chatbot_output(all_messages, display_recv=True)
update_dict = {
chatbot: chatbot_output,
btn_step: gr.update(
value="Next Step", interactive=not timestep.terminal
),
btn_restart: gr.update(interactive=True),
state: cur_state,
}
# Reviewer 1, 2, 3 Area Chair, Paper Extractor, Author
for i, player in enumerate(arena.players):
if 'Reviewer' in player.name and arena.environment.phase_index < 4: # FIXME: 临时逻辑
player_messages = arena.environment.get_observation(player.name)
# 不要显示第一条长段的信息,只显示 文章内容已被抽取
player_messages[0].content = 'Paper content has been extracted.'
player_output = _convert_to_chatbot_output(player_messages)
# Update the player's chatbot output
update_dict[player_chatbots[i]] = player_output
elif arena.environment.phase_index in [4, 5]: # FIXME: 临时逻辑
player_messages = arena.environment.get_observation('AC')
player_messages[0].content = 'Paper content has been extracted.'
player_output = _convert_to_chatbot_output(player_messages)
# Update the player's chatbot output
update_dict[player_chatbots[3]] = player_output
yield update_dict
def restart_game(all_comps: dict):
global CURRENT_STEP_INDEX
CURRENT_STEP_INDEX = 0
cur_state = all_comps[state]
cur_state["arena"] = None
yield {
chatbot: [],
btn_restart: gr.update(interactive=False),
btn_step: gr.update(interactive=False),
state: cur_state,
}
# arena_config = _create_arena_config_from_components(all_comps)
# arena = Arena.from_config(arena_config)
# log_arena(arena, database=DB)
# cur_state["arena"] = arena
yield {
btn_step: gr.update(value="Start", interactive=True),
btn_restart: gr.update(interactive=True),
upload_file_box: gr.update(value=None),
state: cur_state,
}
# Remove Accordion and Tab from the list of components
all_components = [
comp for comp in all_components if not isinstance(comp, (gr.Accordion, gr.Tab))
]
# update component
# env_desc_textbox.change()
# If any of the Textbox, Slider, Checkbox, Dropdown, RadioButtons is changed, the Step button is disabled
for comp in all_components:
def _disable_step_button(state):
if state["arena"] is not None:
return gr.update(interactive=False)
else:
return gr.update()
if (
isinstance(
comp, (gr.Textbox, gr.Slider, gr.Checkbox, gr.Dropdown, gr.Radio)
)
and comp is not upload_file_box
):
comp.change(_disable_step_button, state, btn_step)
# print(set(all_components + [state]))
btn_step.click(
step_game,
set(all_components + [state]),
[chatbot, *player_chatbots, btn_step, btn_restart, state, upload_file_box],
)
btn_restart.click(
restart_game,
set(all_components + [state]),
[chatbot, *player_chatbots, btn_step, btn_restart, state, upload_file_box],
)
demo.queue()
demo.launch(debug=DEBUG, server_port=8082)