feat: refactor model selection to use developer tiers

- Replaced raw model aliases with developer tiers (junior, medior, senior, qa) in dispatch and model selection logic. - Updated `dispatchTask` to resolve models based on tiers and plugin configuration. - Modified `selectModel` to return tier names instead of model aliases based on task description. - Implemented migration logic for transitioning from old model aliases to new tier names in worker state. - Added setup logic for agent creation and model configuration in `setup.ts`. - Created shared templates for workspace files and instructions for DEV/QA workers. - Enhanced project registration to scaffold role files based on developer tiers. - Updated task management tools to reflect changes in model selection and tier assignment. - Introduced a new `devclaw_setup` tool for agent-driven setup and configuration. - Updated plugin configuration schema to support model mapping per developer tier.
2026-02-09 13:41:22 +08:00
parent 8a79755e4c
commit aa8e8dbd1b
16 changed files with 1162 additions and 257 deletions
--- a/lib/tools/devclaw-setup.ts
+++ b/lib/tools/devclaw-setup.ts
@@ -0,0 +1,84 @@
+/**
+ * devclaw_setup — Agent-driven setup tool.
+ *
+ * Creates a new agent (optional), configures model tiers,
+ * and writes workspace files (AGENTS.md, HEARTBEAT.md, roles, memory).
+ */
+import type { OpenClawPluginApi, OpenClawPluginToolContext } from "openclaw/plugin-sdk";
+import { runSetup } from "../setup.js";
+import { ALL_TIERS, DEFAULT_MODELS, type Tier } from "../tiers.js";
+
+export function createSetupTool(api: OpenClawPluginApi) {
+  return (ctx: OpenClawPluginToolContext) => ({
+    name: "devclaw_setup",
+    description: `Set up DevClaw in an agent's workspace. Creates AGENTS.md, HEARTBEAT.md, role templates, memory/projects.json, and writes model tier config to openclaw.json. Optionally creates a new agent. Backs up existing files before overwriting.`,
+    parameters: {
+      type: "object",
+      properties: {
+        newAgentName: {
+          type: "string",
+          description: "Create a new agent with this name. If omitted, configures the current agent's workspace.",
+        },
+        models: {
+          type: "object",
+          description: `Model overrides per tier. Missing tiers use defaults. Example: { "junior": "anthropic/claude-haiku-4-5", "senior": "anthropic/claude-opus-4-5" }`,
+          properties: {
+            junior: { type: "string", description: `Junior dev model (default: ${DEFAULT_MODELS.junior})` },
+            medior: { type: "string", description: `Medior dev model (default: ${DEFAULT_MODELS.medior})` },
+            senior: { type: "string", description: `Senior dev model (default: ${DEFAULT_MODELS.senior})` },
+            qa: { type: "string", description: `QA engineer model (default: ${DEFAULT_MODELS.qa})` },
+          },
+        },
+      },
+    },
+
+    async execute(_id: string, params: Record<string, unknown>) {
+      const newAgentName = params.newAgentName as string | undefined;
+      const modelsParam = params.models as Partial<Record<Tier, string>> | undefined;
+      const workspaceDir = ctx.workspaceDir;
+
+      const result = await runSetup({
+        newAgentName,
+        // If no new agent name, use the current agent's workspace
+        agentId: newAgentName ? undefined : ctx.agentId,
+        workspacePath: newAgentName ? undefined : workspaceDir,
+        models: modelsParam,
+      });
+
+      const lines = [
+        result.agentCreated
+          ? `Agent "${result.agentId}" created`
+          : `Configured workspace for agent "${result.agentId}"`,
+        ``,
+        `Models:`,
+        ...ALL_TIERS.map((t) => `  ${t}: ${result.models[t]}`),
+        ``,
+        `Files written:`,
+        ...result.filesWritten.map((f) => `  ${f}`),
+      ];
+
+      if (result.warnings.length > 0) {
+        lines.push(``, `Warnings:`, ...result.warnings.map((w) => `  ${w}`));
+      }
+
+      lines.push(
+        ``,
+        `Next steps:`,
+        `  1. Add bot to a Telegram group`,
+        `  2. Register a project: "Register project <name> at <repo> for group <id>"`,
+        `  3. Create your first issue and pick it up`,
+      );
+
+      return {
+        content: [{
+          type: "text" as const,
+          text: JSON.stringify({
+            success: true,
+            ...result,
+            summary: lines.join("\n"),
+          }, null, 2),
+        }],
+      };
+    },
+  });
+}
--- a/lib/tools/project-register.ts
+++ b/lib/tools/project-register.ts
@@ -13,6 +13,8 @@ import { readProjects, writeProjects, emptyWorkerState } from "../projects.js";
 import { resolveRepoPath } from "../gitlab.js";
 import { createProvider } from "../providers/index.js";
 import { log as auditLog } from "../audit.js";
+import { DEV_TIERS, QA_TIERS } from "../tiers.js";
+import { DEFAULT_DEV_INSTRUCTIONS, DEFAULT_QA_INSTRUCTIONS } from "../templates.js";

 /**
 * Ensure default role files exist, then copy them into the project's role directory.
@@ -64,31 +66,6 @@ async function scaffoldRoleFiles(workspaceDir: string, projectName: string): Pro
  return created;
 }

-const DEFAULT_DEV_INSTRUCTIONS = `# DEV Worker Instructions
-
- Work in a git worktree (never switch branches in the main repo)
- Run tests before completing
- Create an MR/PR to the base branch and merge it
- Clean up the worktree after merging
- When done, call task_complete with role "dev", result "done", and a brief summary
- If you discover unrelated bugs, call task_create to file them
- Do NOT call task_pickup, queue_status, session_health, or project_register
-`;
-
-const DEFAULT_QA_INSTRUCTIONS = `# QA Worker Instructions
-
- Pull latest from the base branch
- Run tests and linting
- Verify the changes address the issue requirements
- Check for regressions in related functionality
- When done, call task_complete with role "qa" and one of:
-  - result "pass" if everything looks good
-  - result "fail" with specific issues if problems found
-  - result "refine" if you need human input to decide
- If you discover unrelated bugs, call task_create to file them
- Do NOT call task_pickup, queue_status, session_health, or project_register
-`;
-
 export function createProjectRegisterTool(api: OpenClawPluginApi) {
  return (ctx: OpenClawPluginToolContext) => ({
    name: "project_register",
@@ -186,8 +163,8 @@ export function createProjectRegisterTool(api: OpenClawPluginApi) {
        baseBranch,
        deployBranch,
        autoChain: false,
-        dev: emptyWorkerState(["haiku", "sonnet", "opus"]),
-        qa: emptyWorkerState(["grok"]),
+        dev: emptyWorkerState([...DEV_TIERS]),
+        qa: emptyWorkerState([...QA_TIERS]),
      };

      await writeProjects(workspaceDir, data);
--- a/lib/tools/task-complete.ts
+++ b/lib/tools/task-complete.ts
@@ -5,8 +5,8 @@
 * issue close/reopen, audit logging, and optional auto-chaining.
 *
 * When project.autoChain is true:
- *   - DEV "done" → automatically dispatches QA (default model: grok)
- *   - QA "fail" → automatically dispatches DEV fix (reuses previous DEV model)
+ *   - DEV "done" → automatically dispatches QA (qa tier)
+ *   - QA "fail" → automatically dispatches DEV fix (reuses previous DEV tier)
 */
 import type { OpenClawPluginApi, OpenClawPluginToolContext } from "openclaw/plugin-sdk";
 import {
@@ -120,6 +120,7 @@ export function createTaskCompleteTool(api: OpenClawPluginApi) {

        if (project.autoChain) {
          try {
+            const pluginConfig = api.pluginConfig as Record<string, unknown> | undefined;
            const issue = await getIssue(issueId, glabOpts);
            const chainResult = await dispatchTask({
              workspaceDir,
@@ -131,11 +132,12 @@ export function createTaskCompleteTool(api: OpenClawPluginApi) {
              issueDescription: issue.description ?? "",
              issueUrl: issue.web_url,
              role: "qa",
-              modelAlias: "grok",
+              modelAlias: "qa",
              fromLabel: "To Test",
              toLabel: "Testing",
              transitionLabel: (id, from, to) =>
                transitionLabel(id, from as StateLabel, to as StateLabel, glabOpts),
+              pluginConfig,
            });
            output.autoChain = {
              dispatched: true,
@@ -181,6 +183,7 @@ export function createTaskCompleteTool(api: OpenClawPluginApi) {

        if (project.autoChain && devModel) {
          try {
+            const pluginConfig = api.pluginConfig as Record<string, unknown> | undefined;
            const issue = await getIssue(issueId, glabOpts);
            const chainResult = await dispatchTask({
              workspaceDir,
@@ -197,6 +200,7 @@ export function createTaskCompleteTool(api: OpenClawPluginApi) {
              toLabel: "Doing",
              transitionLabel: (id, from, to) =>
                transitionLabel(id, from as StateLabel, to as StateLabel, glabOpts),
+              pluginConfig,
            });
            output.autoChain = {
              dispatched: true,
--- a/lib/tools/task-pickup.ts
+++ b/lib/tools/task-pickup.ts
@@ -23,7 +23,7 @@ import { dispatchTask } from "../dispatch.js";
 export function createTaskPickupTool(api: OpenClawPluginApi) {
  return (ctx: OpenClawPluginToolContext) => ({
    name: "task_pickup",
-    description: `Pick up a task from the issue queue for a DEV or QA worker. Handles everything end-to-end: label transition, model selection, session creation/reuse, task dispatch, state update, and audit logging. The orchestrator should analyze the issue and pass the appropriate model. Returns an announcement for the agent to post — no further session actions needed.`,
+    description: `Pick up a task from the issue queue for a DEV or QA worker. Handles everything end-to-end: label transition, tier assignment, session creation/reuse, task dispatch, state update, and audit logging. The orchestrator should analyze the issue and pass the appropriate developer tier. Returns an announcement for the agent to post — no further session actions needed.`,
    parameters: {
      type: "object",
      required: ["issueId", "role", "projectGroupId"],
@@ -36,7 +36,7 @@ export function createTaskPickupTool(api: OpenClawPluginApi) {
        },
        model: {
          type: "string",
-          description: "Model alias to use (e.g. haiku, sonnet, opus, grok). The orchestrator should analyze the issue complexity and choose. Falls back to keyword heuristic if omitted.",
+          description: "Developer tier (junior, medior, senior, qa). The orchestrator should evaluate the task complexity and choose the right tier. Falls back to keyword heuristic if omitted.",
        },
      },
    },
@@ -101,12 +101,13 @@ export function createTaskPickupTool(api: OpenClawPluginApi) {
        modelSource = "llm";
      } else {
        const selected = selectModel(issue.title, issue.description ?? "", role);
-        modelAlias = selected.alias;
+        modelAlias = selected.tier;
        modelReason = selected.reason;
        modelSource = "heuristic";
      }

      // 5. Dispatch via shared logic
+      const pluginConfig = api.pluginConfig as Record<string, unknown> | undefined;
      const dispatchResult = await dispatchTask({
        workspaceDir,
        agentId: ctx.agentId,
@@ -122,6 +123,7 @@ export function createTaskPickupTool(api: OpenClawPluginApi) {
        toLabel: targetLabel,
        transitionLabel: (id, from, to) =>
          transitionLabel(id, from as StateLabel, to as StateLabel, glabOpts),
+        pluginConfig,
      });

      // 6. Build result