improve(core): require recurrence evidence before extracting skills (#25147)

2026-04-20 10:10:56 -07:00 · 2026-04-15 11:45:31 -07:00
parent 5333e5ab20
commit 485f3d92d8
4 changed files with 502 additions and 22 deletions
@@ -0,0 +1,90 @@
+/**
+ * @license
+ * Copyright 2026 Google LLC
+ * SPDX-License-Identifier: Apache-2.0
+ */
+
+import { describe, expect, it } from 'vitest';
+import { SkillExtractionAgent } from './skill-extraction-agent.js';
+import {
+  EDIT_TOOL_NAME,
+  GLOB_TOOL_NAME,
+  GREP_TOOL_NAME,
+  LS_TOOL_NAME,
+  READ_FILE_TOOL_NAME,
+  WRITE_FILE_TOOL_NAME,
+} from '../tools/tool-names.js';
+import { PREVIEW_GEMINI_FLASH_MODEL } from '../config/models.js';
+
+// Prompt-contract tests for the agent definition returned by SkillExtractionAgent.
+// They pin exact phrases of the system prompt and the query so that the
+// "require recurrence evidence" wording cannot be dropped or reworded unnoticed.
+describe('SkillExtractionAgent', () => {
+  // Fixed fixtures handed to the factory; the query test below checks that the
+  // session index and the existing-skills summary are embedded verbatim.
+  const skillsDir = '/tmp/skills';
+  const sessionIndex =
+    '[NEW] Debug login flow (12 user msgs) — /tmp/chats/session-1.json';
+  const existingSkillsSummary =
+    '## Workspace Skills (.gemini/skills — do NOT duplicate)\n- **existing-skill**: Existing description';
+
+  // Built once and shared: every test only reads from the returned definition.
+  const agent = SkillExtractionAgent(
+    skillsDir,
+    sessionIndex,
+    existingSkillsSummary,
+  );
+
+  // Identity, model and tool list of the agent definition.
+  it('should expose expected metadata, model, and tools', () => {
+    expect(agent.kind).toBe('local');
+    expect(agent.name).toBe('confucius');
+    expect(agent.displayName).toBe('Skill Extractor');
+    expect(agent.modelConfig.model).toBe(PREVIEW_GEMINI_FLASH_MODEL);
+    // arrayContaining is a subset check: these six tools must be present, in
+    // any order, and additional tools do not fail the assertion.
+    expect(agent.toolConfig?.tools).toEqual(
+      expect.arrayContaining([
+        READ_FILE_TOOL_NAME,
+        WRITE_FILE_TOOL_NAME,
+        EDIT_TOOL_NAME,
+        LS_TOOL_NAME,
+        GLOB_TOOL_NAME,
+        GREP_TOOL_NAME,
+      ]),
+    );
+  });
+
+  // System prompt: the recurrence/durability gate and the "ALL criteria" wording.
+  // NOTE: the prompt is assembled from an array of lines joined with '\n', so
+  // every asserted phrase has to fit inside a single prompt line.
+  it('should default to no skill unless recurrence and durability are proven', () => {
+    const prompt = agent.promptConfig.systemPrompt;
+
+    expect(prompt).toContain('Default to NO SKILL.');
+    expect(prompt).toContain(
+      'strong evidence this will recur for future agents in this repo/workflow',
+    );
+    expect(prompt).toContain('broader than a single incident');
+    expect(prompt).toContain('A skill MUST meet ALL of these criteria:');
+    expect(prompt).toContain(
+      'Future agents in this repo/workflow are likely to need it',
+    );
+  });
+
+  // System prompt: the explicit exclusion categories added for one-off material.
+  it('should explicitly reject one-off incidents and single-session preferences', () => {
+    const prompt = agent.promptConfig.systemPrompt;
+
+    expect(prompt).toContain('Single-session preferences');
+    expect(prompt).toContain('One-off incidents');
+    expect(prompt).toContain('Output-style preferences');
+    expect(prompt).toContain('cannot survive renaming the specific');
+  });
+
+  // Query: carries the caller-supplied context plus the warnings that session
+  // summaries alone are not evidence of a reusable workflow.
+  it('should warn that session summaries are user-intent summaries, not workflow evidence', () => {
+    // Fall back to '' if query is absent so the containment checks still run
+    // against a string.
+    const query = agent.promptConfig.query ?? '';
+
+    expect(query).toContain(existingSkillsSummary);
+    expect(query).toContain(sessionIndex);
+    expect(query).toContain(
+      'The summary is a user-intent summary, not a workflow summary.',
+    );
+    expect(query).toContain(
+      'The session summaries describe user intent, not workflow details.',
+    );
+    expect(query).toContain(
+      'Only write a skill if the evidence shows a durable, recurring workflow',
+    );
+    expect(query).toContain(
+      'If recurrence or future reuse is unclear, create no skill and explain why.',
+    );
+  });
+});
@@ -36,7 +36,7 @@ function buildSystemPrompt(skillsDir: string): string {
    '- solve similar tasks with fewer tool calls and fewer reasoning tokens',
    '- reuse proven workflows and verification checklists',
    '- avoid known failure modes and landmines',
-    '- anticipate user preferences without being reminded',
+    '- capture durable workflow constraints that future agents are likely to encounter again',
    '',
    '============================================================',
    'SAFETY AND HYGIENE (STRICT)',
@@ -59,6 +59,10 @@ function buildSystemPrompt(skillsDir: string): string {
    '1. "Is this something a competent agent would NOT already know?" If no, STOP.',
    '2. "Does an existing skill (listed below) already cover this?" If yes, STOP.',
    '3. "Can I write a concrete, step-by-step procedure?" If no, STOP.',
+    '4. "Is there strong evidence this will recur for future agents in this repo/workflow?" If no, STOP.',
+    '5. "Is this broader than a single incident (one bug, one ticket, one branch, one date, one exact error)?" If no, STOP.',
+    '',
+    'Default to NO SKILL.',
    '',
    'Do NOT create skills for:',
    '',
@@ -67,6 +71,10 @@ function buildSystemPrompt(skillsDir: string): string {
    '- **Pure Q&A**: The user asked "how does X work?" and got an answer. No procedure.',
    '- **Brainstorming/design**: Discussion of how to build something, without a validated',
    '  implementation that produced a reusable procedure.',
+    '- **Single-session preferences**: User-specific style/output preferences or workflow',
+    '  preferences mentioned only once.',
+    '- **One-off incidents**: Debugging or incident response tied to a single bug, ticket,',
+    '  branch, date, or exact error string.',
    '- **Anything already covered by an existing skill** (global, workspace, builtin, or',
    '  previously extracted). Check the "Existing Skills" section carefully.',
    '',
@@ -74,31 +82,40 @@ function buildSystemPrompt(skillsDir: string): string {
    'WHAT COUNTS AS A SKILL',
    '============================================================',
    '',
-    'A skill MUST meet BOTH of these criteria:',
+    'A skill MUST meet ALL of these criteria:',
    '',
    '1. **Procedural and concrete**: It can be expressed as numbered steps with specific',
    '   commands, paths, or code patterns. If you can only write vague guidance, it is NOT',
    '   a skill. "Be careful with X" is advice, not a skill.',
    '',
-    '2. **Non-obvious and project-specific**: A competent agent would NOT already know this.',
-    '   It encodes project-specific knowledge, non-obvious ordering constraints, or',
-    '   hard-won failure shields that cannot be inferred from the codebase alone.',
+    '2. **Durable and reusable**: Future agents in this repo/workflow are likely to need it',
+    '   again. If it only solved one incident, it is NOT a skill.',
    '',
-    'Confidence tiers (prefer higher tiers):',
+    '3. **Evidence-backed and project-specific**: It encodes project-specific knowledge,',
+    '   repeated operational constraints, or hard-won failure shields supported by session',
+    '   evidence. Do not assume something is non-obvious just because it sounds detailed.',
    '',
-    '**High confidence** — create the skill:',
-    '- The same workflow appeared in multiple sessions (cross-session repetition)',
-    '- A multi-step procedure was validated (tests passed, user confirmed success)',
+    'Confidence tiers:',
    '',
-    '**Medium confidence** — create the skill if it is clearly project-specific:',
-    '- A project-specific build/test/deploy/release procedure was established',
-    '- A non-obvious ordering constraint or prerequisite was discovered',
-    '- A failure mode was hit and a concrete fix was found and verified',
+    '**High confidence** — create the skill only when recurrence/durability is clear:',
+    '- The same workflow appeared in multiple sessions (cross-session repetition), OR it is',
+    '  a stable recurring repo workflow (for example setup/build/test/deploy/release) with a',
+    '  clear future trigger',
+    '- The workflow was validated (tests passed, user confirmed success, or the same fix',
+    '  worked repeatedly)',
+    '- The skill can be named without referencing a specific incident, bug, branch, or date',
+    '',
+    '**Medium confidence** — usually do NOT create the skill yet:',
+    '- A project-specific procedure appeared once and seems useful, but recurrence is not yet',
+    '  clear',
+    '- A verified fix exists, but it is still tied to one incident',
+    '- A user correction changed the approach once, but durability is uncertain',
    '',
    '**Low confidence** — do NOT create the skill:',
    '- A one-off debugging session with no reusable procedure',
    '- Generic workflows any agent could figure out from the codebase',
    '- A code review or investigation with no durable takeaway',
+    '- Output-style preferences that do not materially change procedure',
    '',
    'Aim for 0-2 skills per run. Quality over quantity.',
    '',
@@ -117,8 +134,10 @@ function buildSystemPrompt(skillsDir: string): string {
    '',
    'What to look for:',
    '',
-    '- User corrections: "No, do it this way" -> preference signal',
+    '- User corrections that change procedure in a durable way, especially when repeated',
+    '  across sessions',
    '- Repeated patterns across sessions: same commands, same file paths, same workflow',
+    '- Stable recurring repo lifecycle workflows with clear future triggers',
    '- Failed attempts followed by successful ones -> failure shield',
    '- Multi-step procedures that were validated (tests passed, user confirmed)',
    '- User interruptions: "Stop, you need to X first" -> ordering constraint',
@@ -129,6 +148,8 @@ function buildSystemPrompt(skillsDir: string): string {
    '- Tool outputs that are just data (file contents, search results)',
    '- Speculative plans that were never executed',
    "- Temporary context (current branch name, today's date, specific error IDs)",
+    '- Similar session summaries without matching workflow evidence',
+    '- One-off artifact names: bug IDs, branch names, timestamps, exact incident strings',
    '',
    '============================================================',
    'SKILL FORMAT',
@@ -214,7 +235,10 @@ function buildSystemPrompt(skillsDir: string): string {
    '- Keep scopes distinct. Avoid overlapping "do-everything" skills.',
    '- Every skill MUST have: triggers, procedure, at least one pitfall or verification step.',
    '- If you cannot write a reliable procedure (too many unknowns), do NOT create the skill.',
-    '- Do not create skills for generic advice that any competent agent would already know.',
+    '- If the candidate is tied to one incident or cannot survive renaming the specific',
+    '  bug/ticket, do NOT create it.',
+    '- Do not create skills for generic advice, output-style preferences, or ephemeral',
+    '  choices that any competent agent would already know or adapt to on the fly.',
    '- Prefer fewer, higher-quality skills. 0-2 skills per run is typical. 3+ is unusual.',
    '',
    '============================================================',
@@ -224,17 +248,23 @@ function buildSystemPrompt(skillsDir: string): string {
    `1. Use list_directory on ${skillsDir} to see existing skills.`,
    '2. If skills exist, read their SKILL.md files to understand what is already captured.',
    '3. Scan the session index provided in the query. Look for [NEW] sessions whose summaries',
-    '   suggest workflows that ALSO appear in other sessions (either [NEW] or [old]).',
-    '4. Apply the minimum signal gate. If no repeated patterns are visible, report that and finish.',
+    '   hint at workflows that ALSO appear in other sessions (either [NEW] or [old]) or at a',
+    '   stable recurring repo workflow. Remember: summary similarity alone is NOT enough.',
+    '4. Apply the minimum signal gate. If recurrence or durability is not visible, report that',
+    '   no skill should be created and finish.',
    '5. For promising patterns, use read_file on the session file paths to inspect the full',
-    '   conversation. Confirm the workflow was actually repeated and validated.',
-    '6. For each confirmed skill, verify it meets ALL criteria (repeatable, procedural, high-leverage).',
+    '   conversation. Confirm the workflow was actually repeated and validated. Read at least',
+    '   two sessions unless the candidate is clearly a stable recurring repo lifecycle workflow.',
+    '6. For each candidate, verify it meets ALL criteria. Before writing, make sure you can',
+    '   state: future trigger, evidence sessions, recurrence signal, validation signal, and',
+    '   why it is not generic.',
    '7. Write new SKILL.md files or update existing ones in your directory using write_file.',
    '   For skills that live OUTSIDE your directory, write a .patch file instead (see UPDATING EXISTING SKILLS).',
    '8. Write COMPLETE files — never partially update a SKILL.md.',
    '',
    'IMPORTANT: Do NOT read every session. Only read sessions whose summaries suggest a',
-    'repeated pattern worth investigating. Most runs should read 0-3 sessions and create 0 skills.',
+    'repeated pattern or a stable recurring repo workflow worth investigating. Most runs',
+    'should read 0-3 sessions and create 0 skills.',
    'Do not explore the codebase. Work only with the session index, session files, and the skills directory.',
  ].join('\n');
 }
@@ -301,6 +331,9 @@ export const SkillExtractionAgent = (
        'Below is an index of past conversation sessions. Each line shows:',
        '[NEW] or [old] status, a 1-line summary, message count, and the file path.',
        '',
+        'The summary is a user-intent summary, not a workflow summary.',
+        'Matching summary text alone is never enough evidence for a reusable skill.',
+        '',
        '[NEW] = not yet processed for skill extraction (focus on these)',
        '[old] = previously processed (read only if a [NEW] session hints at a repeated pattern)',
        '',
@@ -319,7 +352,7 @@ export const SkillExtractionAgent = (

    return {
      systemPrompt: buildSystemPrompt(skillsDir),
-      query: `${initialContext}\n\nAnalyze the session index above. Read sessions that suggest repeated workflows using read_file. Extract reusable skills to ${skillsDir}/.`,
+      query: `${initialContext}\n\nAnalyze the session index above. The session summaries describe user intent, not workflow details. Read sessions that suggest repeated workflows using read_file. Only write a skill if the evidence shows a durable, recurring workflow or a stable recurring repo procedure. If recurrence or future reuse is unclear, create no skill and explain why.`,
    };
  },
  runConfig: {