Skip to content

Commit b8b0f8c

Browse files
authored
Update summarize_results.py
1 parent 7c34ad4 commit b8b0f8c

File tree

1 file changed

+0
-10
lines changed

1 file changed

+0
-10
lines changed

evaluation/summarize_results.py

Lines changed: 0 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -87,16 +87,6 @@ def main():
87 87
os.makedirs(task_dirname, exist_ok=True)
88 88
metric_path = os.path.join(task_dirname, "metrics.json")
89 89
pred_path = os.path.join(task_dirname, "predictions.json")
90-
if 'math6' in dataset.lower() and task == 'cot':
91-
data_to_score = []
92-
for pred in task2pred[task]:
93-
item = deepcopy(pred['metadata'])
94-
item['model_answer_turns_1'] = pred['turns'][0]['model_output']
95-
item['model_answer_turns_2'] = pred['turns'][1]['model_output']
96-
data_to_score.append(item)
97-
_metrics = math6_score(data_to_score)
98-
task2metric[task].update(_metrics)
99-
model2dataset2task2metric[model][dataset][task].update(_metrics)
100 90
json.dump(task2metric[task], open(metric_path, "w"), indent=4)
101 91
json.dump(task2pred[task], open(pred_path, "w"), indent=4)
102 92
if 'minif2f' in dataset.lower() and 'isabelle' in dataset.lower() and task2pred[task] and args.eval_atp:

0 commit comments

Comments (0)