From d1f264f4114415f0b8529e370940772a734a7b90 Mon Sep 17 00:00:00 2001 From: Shay Lapid <36539200+lapidshay@users.noreply.github.com> Date: Mon, 1 Jul 2024 00:09:23 +0300 Subject: [PATCH] Update evaluate.py Calculating gt_pass_rate before evaluating the expression "gt_pass_rate > 0.99". --- bigcodebench/evaluate.py | 1 + 1 file changed, 1 insertion(+) diff --git a/bigcodebench/evaluate.py b/bigcodebench/evaluate.py index 619be0e..42a817b 100644 --- a/bigcodebench/evaluate.py +++ b/bigcodebench/evaluate.py @@ -250,6 +250,7 @@ def stucking_checker(): if flags.no_gt: cprint(f"Groundtruth is not checked", "yellow") else: + gt_pass_rate = np.mean([1 if v is not None else 0 for v in expected_time.values()]) if gt_pass_rate > 0.99: cprint(f"Groundtruth pass rate: {gt_pass_rate:.3f}", "green") else: