匹配字符

import re
from tqdm import tqdm

# Evaluate the model on the MATH dataset

# Exact-match evaluation on integer answers written as \boxed{<int>}.
# `dataset` (iterable of dicts with 'problem' and 'solution' keys) and
# `generate_answer` (prompt -> generated text) must be defined before this runs.

# One pattern for both the reference solution and the model output.
# `\\boxed` matches a literal backslash; a bare `\b` would be a regex
# word-boundary assertion and would also accept "boxed{...}" without it.
boxed_int_re = re.compile(r'\\boxed\{([+-]?\d+)\}')

correct = 0
total = 0

for example in tqdm(dataset):
    prompt = example['problem']
    ans = boxed_int_re.findall(example['solution'])

    generated_ans = generate_answer(prompt)
    parsed_ans = boxed_int_re.findall(generated_ans)

    # Require at least one reference answer: otherwise two empty lists would
    # compare equal and a problem with no integer boxed answer would be
    # scored as correct whenever the model also produced none.
    if ans and parsed_ans == ans:
        correct += 1
    total += 1

# Guard against an empty dataset instead of raising ZeroDivisionError.
accuracy = correct / total if total else 0.0
print(f"Accuracy: {accuracy * 100:.2f}%")

# Select a subset of samples from the dataset
# range(20) yields indices 0-19, so this keeps the first 20 examples.
# NOTE(review): `dataset` is defined outside this snippet; presumably a
# Hugging Face `datasets.Dataset`, whose `select` takes row indices — confirm.
A = dataset.select(range(20))

posted @ 2024-12-30 19:35  HaibaraYuki  阅读(5)  评论(0)    收藏  举报