2026-06-12 14:02:15 +08:00
|
|
|
|
"""Supported metric names recognized by scenario validation and pipeline setup."""
|
|
|
|
|
|
|
|
|
|
|
|
# Metric identifiers accepted by scenario validation and pipeline setup.
# Membership is by exact, case-sensitive string match on the names below.
SUPPORTED_METRICS = {
    # Core retrieval / generation metrics (always available).
    "faithfulness",
    "answer_relevancy",
    "context_recall",
    "context_precision",
    # Robustness and end-to-end metrics (see the Architecture Design document, §10.2).
    # Robustness: sensitivity to retrieval noise.
    "noise_sensitivity",
    # End-to-end: factual correctness of the answer relative to the reference answer.
    "factual_correctness",
    # End-to-end: semantic similarity between the answer and the reference answer
    # (embedding-based, no LLM call).
    "semantic_similarity",
}
|