From 2fa4cb900667c2412b18ab036cf2b49ae0780861 Mon Sep 17 00:00:00 2001 From: YangQianli92 <108046369+YangQianli92@users.noreply.github.com> Date: Wed, 17 Apr 2024 11:23:24 +0800 Subject: [PATCH] Update base.py --- metagpt/rag/benchmark/base.py | 17 ++++++++--------- 1 file changed, 8 insertions(+), 9 deletions(-) diff --git a/metagpt/rag/benchmark/base.py b/metagpt/rag/benchmark/base.py index 0ba52e324..2634f139f 100644 --- a/metagpt/rag/benchmark/base.py +++ b/metagpt/rag/benchmark/base.py @@ -184,14 +184,13 @@ if __name__ == "__main__": answer = "是的,根据提供的信息,2023年7月20日,应急管理部和财政部确实联合发布了《因灾倒塌、损坏住房恢复重建救助工作规范》的通知。这份《规范》旨在进一步规范因灾倒塌、损坏住房的恢复重建救助相关工作。它明确了地方各级政府负责实施救助工作,应急管理部和财政部则负责统筹指导。地方财政应安排足够的资金,中央财政也会提供适当的补助。救助资金将通过专账管理,并采取特定的管理方式。救助对象是那些因自然灾害导致住房倒塌或损坏,并向政府提出申请且符合条件的受灾家庭。相关部门将组织调查统计救助对象信息,并建立档案。此外,《规范》还强调了资金发放的具体方式和公开透明的要求。" ground_truth = "“启明行动”是为了防控儿童青少年的近视问题,并发布了《防控儿童青少年近视核心知识十条》。" bleu_avg, bleu1, bleu2, bleu3, bleu4 = benchmark.bleu_score(answer, ground_truth) - logger.info(f"bleu_avg = {bleu_avg}") - logger.info(f"bleu1 = {bleu1}") - logger.info(f"bleu2 = {bleu2}") - logger.info(f"bleu3 = {bleu3}") - logger.info(f"bleu4 = {bleu4}") - rougeL_score = benchmark.rougel_score(answer, ground_truth) - logger.info(f"rougeL_score = {rougeL_score}") - similarity = asyncio.run(benchmark.SemanticSimilarity(answer, ground_truth)) - logger.info(f"similarity = {similarity}") + + logger.info( + f"BLEU Scores: bleu_avg = {bleu_avg}, bleu1 = {bleu1}, bleu2 = {bleu2}, bleu3 = {bleu3}, bleu4 = {bleu4}, " + f"RougeL Score: {rougeL_score}, " + f"Semantic Similarity: {similarity}" + ) + +