We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4aa2e44, commit 229dbc2 (Copy full SHA for 229dbc2)
bigcodebench/evaluate.py
@@ -50,7 +50,7 @@ def get_groundtruth(problems, hashcode, check_gt_only):
50
expected_time = {}
51
for task_id, problem in tqdm(problems.items()):
52
expected_time[task_id] = trusted_exec(
53
- problem["complete_prompt"] + "\n" + problem["clean_canonical_solution"],
+ problem["complete_prompt"] + "\n" + problem["canonical_solution"],
54
problem["test"],
55
problem["task_id"],
56
)
0 commit comments