---
# Scenario configuration for "sample-pdf-question-bank-online" (mode: online).
#
# NOTE(review): this document was rebuilt from a flattened, blame-style dump
# in which every line had lost its indentation and was interleaved with
# commit timestamps and table separators. Keys and values are reproduced
# exactly; the nesting below is inferred from key order -- confirm against
# the consumer's schema.

scenario_name: sample-pdf-question-bank-online
mode: online

# Relative path; the base directory it resolves against is decided by the
# consumer -- presumably this file's directory; TODO confirm.
dataset: ../../datasets/raw/generated/sample-pdf-question-bank.csv

judge_model: qwen3.5-flash
embedding_model: text-embedding-v3

# Metrics requested for this scenario.
metrics:
  - faithfulness
  - answer_relevancy
  - context_recall
  - context_precision

# Relative path, same resolution caveat as `dataset`.
output_dir: ../../outputs/online/sample-pdf-question-bank

runtime:
  batch_size: 2
  app_concurrency: 2
  metric_concurrency: 2
  max_samples: 45

app_adapter:
  type: python
  # "module.path:attribute" style reference to the adapter entry point.
  callable: apps.pdf_question_bank.adapter:run
  static_kwargs:
    source_chunks_path: ../../outputs/dataset-builds/sample-pdf-question-bank/latest/source_chunks.jsonl
    # NOTE(review): `model` directly followed `source_chunks_path` in the
    # flattened dump, so it is assumed to be a static kwarg of the adapter
    # callable. Verify it does not belong under `app_adapter` or at the top
    # level instead.
    model: glm-5