Evaluation
Evaluating the output of your agentic system
Configuring your application
"autoload-dev": {
"psr-4": {
"App\\Evaluators\\": "evaluators/"
}
},
Creating Evaluator
namespace App\Evaluators;
use NeuronAI\Chat\Messages\UserMessage;
use NeuronAI\Evaluation\Assertions\StringContains;
use NeuronAI\Evaluation\BaseEvaluator;
use NeuronAI\Evaluation\Contracts\DatasetInterface;
use NeuronAI\Evaluation\Dataset\JsonDataset;
class AgentEvaluator extends BaseEvaluator
{
/**
 * Supplies the dataset this evaluator iterates over.
 *
 * Builds a JsonDataset from `datasets/dataset.json`, resolved relative to
 * the directory containing this class file.
 */
public function getDataset(): DatasetInterface
{
    $datasetPath = __DIR__ . '/datasets/dataset.json';

    return new JsonDataset($datasetPath);
}
/**
 * Executes the agent for one dataset item and returns the reply content.
 *
 * @param array $datasetItem One dataset entry; its 'input' value is wrapped
 *                           in a UserMessage and sent to the agent.
 *
 * @return mixed Whatever getContent() yields on the agent's response message.
 *
 * @throws \InvalidArgumentException When the item carries no 'input' value.
 */
public function run(array $datasetItem): mixed
{
    // Fail loudly on a malformed dataset item instead of prompting the agent
    // with an undefined value.
    if (!isset($datasetItem['input'])) {
        throw new \InvalidArgumentException("Dataset item has no 'input' value.");
    }

    // NOTE(review): MyAgent is the application's own agent class; it must be
    // imported (or live in this namespace) — confirm where it is declared.
    $message = MyAgent::make()
        ->chat(new UserMessage($datasetItem['input']))
        ->getMessage();

    return $message->getContent();
}
/**
 * Checks the agent output for one dataset item.
 *
 * Registers a single StringContains assertion, built from the item's
 * 'reference' value, against the given output.
 *
 * @param mixed $output      Value previously returned by run() for this item.
 * @param array $datasetItem The dataset entry; its 'reference' value is read.
 */
public function evaluate(mixed $output, array $datasetItem): void
{
    $reference = $datasetItem['reference'];
    $containsReference = new StringContains($reference);

    $this->assert($containsReference, $output);
}
}
Defining The Dataset
ArrayDataset
JsonDataset
Running Evaluations
Last updated