debug(evals): add debug logging and exclude nulllinter from vitest

This commit is contained in:
Alisa Novikova
2026-04-08 22:45:09 -07:00
parent 90ff8feb4c
commit ce26052630
3 changed files with 8 additions and 2 deletions
+2 -2
View File
@@ -15,8 +15,8 @@ describe('Related Eval Demonstration', () => {
},
prompt: 'What is in test.txt?',
assert: async (rig: TestRig, result: string) => {
// This assertion is designed to fail.
expect(result).toContain('THE MODEL WILL NEVER SAY THIS EXACT SENTENCE');
// This assertion is GUARANTEED TO FAIL.
expect(1).toBe(2);
},
});
});
+1
View File
@@ -21,6 +21,7 @@ export default defineConfig({
json: 'evals/logs/report.json',
},
include: ['**/*.eval.ts'],
exclude: ['**/node_modules/**', '**/dist/**', '**/nulllinter/**'],
environment: 'node',
globals: true,
alias: {
+5
View File
@@ -245,12 +245,17 @@ async function processResults(firstPass, pattern, model, files) {
let totalProcessed = 0;
for (const fileResult of firstPass.testResults) {
console.log(`\nDebug: Processing file ${fileResult.name}`);
for (const assertion of fileResult.assertionResults) {
if (assertion.status !== 'passed' && assertion.status !== 'failed') {
console.log(
` - Skipping test: ${assertion.title} (status: ${assertion.status})`,
);
continue;
}
const name = assertion.title;
console.log(` - Test: ${name} (status: ${assertion.status})`);
results[name] = {
passed: assertion.status === 'passed' ? 1 : 0,
total: 1,