langchain/tests/unit_tests/evaluation/criteria/test_eval_chain.py

32 lines
1015 B
Python
Raw Normal View History

"""Test the criteria eval chain."""
from langchain.evaluation.criteria.eval_chain import (
HELPFULNESS_CRITERION,
CriteriaEvalChain,
)
from langchain.evaluation.schema import StringEvaluator
from tests.unit_tests.llms.fake_llm import FakeLLM
def test_resolve_criteria() -> None:
assert CriteriaEvalChain.resolve_criteria("helpfulness") == HELPFULNESS_CRITERION
assert CriteriaEvalChain.resolve_criteria(["helpfulness"]) == HELPFULNESS_CRITERION
def test_criteria_eval_chain() -> None:
chain = CriteriaEvalChain.from_llm(
llm=FakeLLM(
queries={"text": "The meaning of life\nY"}, sequential_responses=True
),
criteria={"my criterion": "my criterion description"},
)
result = chain.evaluate_strings(
prediction="my prediction", reference="my reference", input="my input"
)
assert result["reasoning"] == "The meaning of life"
def test_implements_string_protocol() -> None:
assert isinstance(CriteriaEvalChain, StringEvaluator)