feat: refactor model selection to use developer tiers

- Replaced raw model aliases with developer tiers (junior, medior, senior, qa) in dispatch and model selection logic.
- Updated `dispatchTask` to resolve models based on tiers and plugin configuration.
- Modified `selectModel` to return a tier name, rather than a model alias, based on the task description.
- Implemented migration logic for transitioning from old model aliases to new tier names in worker state.
- Added setup logic for agent creation and model configuration in `setup.ts`.
- Created shared templates for workspace files and instructions for DEV/QA workers.
- Enhanced project registration to scaffold role files based on developer tiers.
- Updated task management tools to reflect changes in model selection and tier assignment.
- Introduced a new `devclaw_setup` tool for agent-driven setup and configuration.
- Updated plugin configuration schema to support model mapping per developer tier.
2026-02-09 13:41:22 +08:00
parent 8a79755e4c
commit aa8e8dbd1b
16 changed files with 1162 additions and 257 deletions
--- a/lib/model-selector.ts
+++ b/lib/model-selector.ts
@@ -1,11 +1,11 @@
 /**
 * Model selection for dev/qa tasks.
- * MVP: Simple heuristic-based selection. LLM-based analysis can be added later.
+ * Keyword heuristic fallback — used when the orchestrator doesn't specify a tier.
+ * Returns tier names (junior, medior, senior, qa) instead of model aliases.
 */

 export type ModelRecommendation = {
-  model: string;
-  alias: string;
+  tier: string;
  reason: string;
 };

@@ -39,13 +39,13 @@ const COMPLEX_KEYWORDS = [
 ];

 /**
- * Select appropriate model based on task description.
+ * Select appropriate developer tier based on task description.
 *
- * Model tiers:
- * - haiku: very simple (typos, single-file fixes, CSS tweaks)
- * - grok: default QA (code inspection, validation, test runs)
- * - sonnet: default DEV (features, bug fixes, multi-file changes)
- * - opus: deep/architectural (system-wide refactoring, novel design)
+ * Developer tiers:
+ * - junior: very simple (typos, single-file fixes, CSS tweaks)
+ * - medior: standard DEV (features, bug fixes, multi-file changes)
+ * - senior: deep/architectural (system-wide refactoring, novel design)
+ * - qa: all QA tasks (code inspection, validation, test runs)
 */
 export function selectModel(
  issueTitle: string,
@@ -54,9 +54,8 @@ export function selectModel(
 ): ModelRecommendation {
  if (role === "qa") {
    return {
-      model: "github-copilot/grok-code-fast-1",
-      alias: "grok",
-      reason: "Default QA model for code inspection and validation",
+      tier: "qa",
+      reason: "Default QA tier for code inspection and validation",
    };
  }

@@ -67,8 +66,7 @@ export function selectModel(
  const isSimple = SIMPLE_KEYWORDS.some((kw) => text.includes(kw));
  if (isSimple && wordCount < 100) {
    return {
-      model: "anthropic/claude-haiku-4-5",
-      alias: "haiku",
+      tier: "junior",
      reason: `Simple task detected (keywords: ${SIMPLE_KEYWORDS.filter((kw) => text.includes(kw)).join(", ")})`,
    };
  }
@@ -77,16 +75,14 @@ export function selectModel(
  const isComplex = COMPLEX_KEYWORDS.some((kw) => text.includes(kw));
  if (isComplex || wordCount > 500) {
    return {
-      model: "anthropic/claude-opus-4-5",
-      alias: "opus",
+      tier: "senior",
      reason: `Complex task detected (${isComplex ? "keywords: " + COMPLEX_KEYWORDS.filter((kw) => text.includes(kw)).join(", ") : "long description"})`,
    };
  }

-  // Default: sonnet for standard dev work
+  // Default: medior for standard dev work
  return {
-    model: "anthropic/claude-sonnet-4-5",
-    alias: "sonnet",
+    tier: "medior",
    reason: "Standard dev task — multi-file changes, features, bug fixes",
  };
 }