We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ce4831c, commit a5bff4a (Copy full SHA for a5bff4a)
bigcodebench/evaluate.py
@@ -142,7 +142,7 @@ def evaluate(flags):
142
143
if flags.check_gt_only:
144
145
- if gt_pass_rate > 0.95:
+ if gt_pass_rate > 0.99:
146
cprint(f"Groundtruth pass rate: {gt_pass_rate:.3f}", "green")
147
else:
148
cprint(f"Groundtruth pass rate: {gt_pass_rate:.3f}\nPlease be cautious!", "red")
@@ -250,7 +250,7 @@ def stucking_checker():
250
if flags.no_gt:
251
cprint(f"Groundtruth is not checked", "yellow")
252
253
254
255
256
0 commit comments