'function login(username, password) {\n if (!username) throw new Error("Missing username");\n // BUG: missing password check\n return true;\n}',
}asconst;
describe('tracker_mode',()=>{
evalTest('USUALLY_PASSES',{
name:'should manage tasks in the tracker when explicitly requested during a bug fix',
params:{
settings:{experimental:{taskTracker: true}},
},
files: FILES,
prompt:
'We have a bug in src/login.js: the password check is missing. First, create a task in the tracker to fix it. Then fix the bug, and mark the task as closed.',
name:'should implicitly create tasks when asked to build a feature plan',
params:{
settings:{experimental:{taskTracker: true}},
},
files: FILES,
prompt:
'I need to build a complex new feature for user authentication in our project. Create a detailed implementation plan and organize the work into bite-sized chunks. Do not actually implement the code yet, just plan it.',
assert: async(rig,result)=>{
// The model should proactively use tracker_create_task to organize the work
// Await the rig's report for the create-task tool and bind it to
// `wasToolCalled`, which the expectation that follows reads.
const wasToolCalled = await rig.waitForToolCall(
  TRACKER_CREATE_TASK_TOOL_NAME,
);
expect(
wasToolCalled,
'Expected tracker_create_task to be called implicitly to organize plan',