Skip to content

Commit

Permalink
logname fix; improve test calling instruction (All-Hands-AI#3666)
Browse files Browse the repository at this point in the history
  • Loading branch information
tobitege committed Aug 30, 2024
1 parent 99139e9 commit dbb671a
Show file tree
Hide file tree
Showing 2 changed files with 5 additions and 3 deletions.
5 changes: 3 additions & 2 deletions evaluation/aider_bench/run_infer.py
Original file line number Diff line number Diff line change
Expand Up @@ -177,9 +177,10 @@ def process_instance(
  signature_file=f'{instance.instance_name}.py',
  )
  if USE_UNIT_TESTS:
+ print(f'\nInstruction to run test_file: {instance.instance_name}_test.py\n')
  instruction += (
- f'Use the test_file: {instance.instance_name}_test.py, to verify '
- 'the correctness of your solution. DO NOT EDIT the test file.\n\n'
+ f'Use `python -m unittest {instance.instance_name}_test.py` to run the test_file '
+ 'and verify the correctness of your solution. DO NOT EDIT the test file.\n\n'
  )

  instruction += (
Expand Down
3 changes: 2 additions & 1 deletion evaluation/utils/shared.py
Original file line number Diff line number Diff line change
Expand Up @@ -139,13 +139,14 @@ def make_metadata(
  details: dict[str, Any] | None = None,
  ) -> EvalMetadata:
  model_name = llm_config.model.split('/')[-1]
+ model_path = model_name.replace(':', '_')
  eval_note = f'_N_{eval_note}' if eval_note else ''

  eval_output_path = os.path.join(
  eval_output_dir,
  dataset_name,
  agent_class,
- f'{model_name}_maxiter_{max_iterations}{eval_note}',
+ f'{model_path}_maxiter_{max_iterations}{eval_note}',
  )

  pathlib.Path(eval_output_path).mkdir(parents=True, exist_ok=True)
Expand Down

0 comments on commit dbb671a

Please sign in to comment.