From 9d2f3925ae559db8aab359fdbe7df201084aaa7c Mon Sep 17 00:00:00 2001 From: Kevin Lin Date: Wed, 8 Jan 2025 14:55:19 -0800 Subject: [PATCH] update eval --- evaluate_gsm8k.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/evaluate_gsm8k.py b/evaluate_gsm8k.py index 0bf5611693..17f15c4ae6 100644 --- a/evaluate_gsm8k.py +++ b/evaluate_gsm8k.py @@ -99,7 +99,7 @@ def evaluate(input_file: str): example_num_rethinks.append(num_rethinks) print("Accuracy (any correct): ", any_correct_count / total) - print("Accuracy (final): ", correct / total) + print("Accuracy (majority vote): ", correct / total) with jsonlines.open(input_file) as reader: lines = list(reader) print("avg. num rethinks: ", statistics.mean(example_num_rethinks))