update
This commit is contained in:
@@ -69,7 +69,13 @@ def build_models(
|
||||
"""
|
||||
client_kwargs = _resolve_openai_client_kwargs(judge_model, settings)
|
||||
client = AsyncOpenAI(**client_kwargs)
|
||||
llm = llm_factory(judge_model, client=client)
|
||||
# RAGAS structured-output judge calls can be truncated by the upstream default
|
||||
# 1024 completion budget, especially for faithfulness and GPT-5 family models.
|
||||
llm = llm_factory(
|
||||
judge_model,
|
||||
client=client,
|
||||
max_tokens=max(1, int(settings.ragas_llm_max_tokens)),
|
||||
)
|
||||
embeddings = embedding_factory(provider="openai", model=embedding_model, client=client)
|
||||
return llm, embeddings
|
||||
|
||||
|
||||
Reference in New Issue
Block a user