Skip to content

Commit cf910df

Browse files
authored
fix eval api_key leak in metadata; fix llm config in run infer (OpenHands#2998)
1 parent 692fe21 commit cf910df

16 files changed

Lines changed: 34 additions & 15 deletions

File tree

evaluation/EDA/run_infer.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -62,7 +62,7 @@ def process_instance(
6262
reset_logger: bool = True,
6363
):
6464
# Create the agent
65-
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(llm_config=metadata.llm_config))
65+
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(config=metadata.llm_config))
6666
# Setup the logger properly, so you can run multi-processing to parallelize the evaluation
6767
eval_output_dir = metadata.eval_output_dir
6868
if reset_logger:

evaluation/agent_bench/run_infer.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,7 @@ def process_instance(
3737
reset_logger: bool = True,
3838
):
3939
# Create the agent
40-
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(llm_config=metadata.llm_config))
40+
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(config=metadata.llm_config))
4141

4242
inst_id = instance.instance_id
4343
question = instance.description

evaluation/biocoder/run_infer.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -87,7 +87,7 @@ def process_instance(
8787
reset_logger: bool = True,
8888
):
8989
# Create the agent
90-
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(llm_config=metadata.llm_config))
90+
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(config=metadata.llm_config))
9191
instance = BiocoderData(**instance)
9292
print(instance)
9393
workspace_dir_name = (

evaluation/bird/run_infer.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -126,7 +126,7 @@ def process_instance(
126126
reset_logger: bool = True,
127127
):
128128
# Create the agent
129-
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(llm_config=metadata.llm_config))
129+
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(config=metadata.llm_config))
130130
workspace_mount_path = os.path.join(
131131
config.workspace_mount_path, 'bird_eval_workspace'
132132
)

evaluation/browsing_delegation/run_infer.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -31,7 +31,7 @@ def process_instance(
3131
reset_logger: bool = True,
3232
):
3333
# Create the agent
34-
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(llm_config=metadata.llm_config))
34+
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(config=metadata.llm_config))
3535
env_id = instance.instance_id
3636
# Setup the logger properly, so you can run multi-processing to parallelize the evaluation
3737
if reset_logger:

evaluation/gaia/run_infer.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -48,7 +48,7 @@ def process_instance(
4848
reset_logger: bool = True,
4949
):
5050
# Create the agent
51-
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(llm_config=metadata.llm_config))
51+
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(config=metadata.llm_config))
5252
# create process-specific workspace dir
5353
# we will create a workspace directory for EACH process
5454
# so that different agent don't interfere with each other.

evaluation/gpqa/run_infer.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -120,7 +120,7 @@ def process_instance(
120120
reset_logger: bool = True,
121121
):
122122
# Create the agent
123-
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(llm_config=metadata.llm_config))
123+
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(config=metadata.llm_config))
124124
old_workspace_mount_path = config.workspace_mount_path
125125
old_workspace_base = config.workspace_base
126126
try:

evaluation/humanevalfix/run_infer.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -108,7 +108,7 @@ def process_instance(
108108
reset_logger: bool = True,
109109
):
110110
# Create the agent
111-
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(llm_config=metadata.llm_config))
111+
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(config=metadata.llm_config))
112112
old_workspace_mount_path = config.workspace_mount_path
113113
old_workspace_base = config.workspace_base
114114

evaluation/logic_reasoning/run_infer.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -103,7 +103,7 @@ def process_instance(
103103
reset_logger: bool = True,
104104
):
105105
# Create the agent
106-
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(llm_config=metadata.llm_config))
106+
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(config=metadata.llm_config))
107107
old_workspace_mount_path = config.workspace_mount_path
108108
old_workspace_base = config.workspace_base
109109

evaluation/miniwob/run_infer.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -41,7 +41,7 @@ def process_instance(
4141
reset_logger: bool = True,
4242
):
4343
# Create the agent
44-
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(llm_config=metadata.llm_config))
44+
agent = Agent.get_cls(metadata.agent_class)(llm=LLM(config=metadata.llm_config))
4545
env_id = instance.id
4646
# Setup the logger properly, so you can run multi-processing to parallelize the evaluation
4747
if reset_logger:

0 commit comments

Comments
 (0)