File tree Expand file tree Collapse file tree 1 file changed +3
-3
lines changed
Expand file tree Collapse file tree 1 file changed +3
-3
lines changed Original file line number Diff line number Diff line change @@ -138,8 +138,10 @@ def evaluate(flags):
138138
139139 results = compatible_eval_result (results )
140140 else :
141+ gt_pass_rate = np .mean ([1 if v is not None else 0 for v in expected_time .values ()])
141142
142143 if flags .check_gt_only :
144+
143145 if gt_pass_rate > 0.95 :
144146 cprint (f"Groundtruth pass rate: { gt_pass_rate :.3f} " , "green" )
145147 else :
@@ -244,9 +246,7 @@ def stucking_checker():
244246 mode = "-calibrated" if "sanitized-calibrated" in flags .samples else ""
245247 flags .subset = flags .subset [0 ].upper () + flags .subset [1 :]
246248 cprint (f"BigCodeBench-{ flags .subset } { mode } " , "green" )
247-
248- gt_pass_rate = np .mean ([1 if v is not None else 0 for v in expected_time .values ()])
249-
249+
250250 if flags .no_gt :
251251 cprint (f"Groundtruth is not checked" , "yellow" )
252252 else :
You can’t perform that action at this time.
0 commit comments