We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent afbf8de commit 32324d2Copy full SHA for 32324d2
bigcodebench/evaluate.py
@@ -276,6 +276,12 @@ def stucking_checker():
276
if not os.path.isfile(result_path):
277
with open(result_path, "w") as f:
278
json.dump(results, f, indent=2)
279
+
280
+ pass_at_k_path = result_path.replace("_eval_results.json", "_pass_at_k.json")
281
+ pass_at_k["model"] = flags.samples.split("/")[-1].replace(".jsonl", "")
282
+ pass_at_k["subset"] = flags.subset
283
+ with open(pass_at_k_path, "w") as f:
284
+ json.dump(pass_at_k, f, indent=2)
285
286
287
def main():
0 commit comments