We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 0695a63 commit 7b688cd (Copy full SHA for 7b688cd)
bigcodebench/evaluate.py
@@ -118,11 +118,12 @@ def evaluate(flags):
118
# bypass the samples
119
flags.samples = "__dummy__.jsonl"
120
121
+ extra = flags.subset + "_" if flags.subset != "full" else ""
122
if os.path.isdir(flags.samples):
- result_path = os.path.join(flags.samples, "eval_results.json")
123
+ result_path = os.path.join(flags.samples, f"{extra}eval_results.json")
124
else:
125
assert flags.samples.endswith(".jsonl")
- result_path = flags.samples.replace(".jsonl", "_eval_results.json")
126
+ result_path = flags.samples.replace(".jsonl", f"_{extra}eval_results.json")
127
128
problems = get_bigcodebench(subset=flags.subset)
129
dataset_hash = get_bigcodebench_hash(subset=flags.subset)
0 commit comments