Eval Harness
Location
examples/evals-example/
How It Works
Setup
pnpm add @m4trix/evals
Run Evals
Key Files in evals-example
Config
Next
Last updated
examples/evals-example/
pnpm add @m4trix/evals
Last updated
eval-agents-simple run --dataset "Demo Dataset" --evaluator "Demo Score Evaluator"
eval-agents-simple run --dataset "*Demo*" --evaluator "*Score*"
import { defineConfig, type ConfigType } from '@m4trix/evals';
/**
 * Default-exported eval configuration for the example project.
 *
 * A factory is handed to `defineConfig`; each call of the factory builds and
 * returns a fresh `ConfigType` object holding the discovery settings and the
 * artifact directory.
 */
export default defineConfig((): ConfigType => {
  const evalConfig: ConfigType = {
    discovery: {
      // Directory the discovery settings are rooted at.
      rootDir: 'src/evals',
      // One pattern list per kind of eval file.
      datasetFilePatterns: ['.dataset.ts'],
      evaluatorFilePatterns: ['.evaluator.ts'],
      testCaseFilePatterns: ['.test-case.ts'],
      // Directory names listed for exclusion.
      excludeDirectories: ['node_modules', 'dist'],
    },
    // NOTE(review): presumably where run results are written — confirm against the package docs.
    artifactDirectory: 'src/evals/.eval-results',
  };

  return evalConfig;
});