aiq.eval.evaluator.evaluator_model
Classes
Module Contents
- class EvalInputItem(/, **data: Any)
Bases: pydantic.BaseModel
- id: Any
- input_obj: Any
- expected_output_obj: Any
- output_obj: Any
- expected_trajectory: list[aiq.data_models.intermediate_step.IntermediateStep]
- trajectory: list[aiq.data_models.intermediate_step.IntermediateStep]
- class EvalInput(/, **data: Any)
Bases: pydantic.BaseModel
- eval_input_items: list[EvalInputItem]
- class EvalOutputItem(/, **data: Any)
Bases: pydantic.BaseModel
- id: Any
- score: Any
- reasoning: Any
- class EvalOutput(/, **data: Any)
Bases: pydantic.BaseModel
- average_score: Any
- eval_output_items: list[EvalOutputItem]