Refine async agent and translation regressions

vaur94 · vaur94 · commit 92b38e05023b · 2026-04-23T08:59:11.000+03:00
diff --git a/packages/opencode/src/agent/agent.ts b/packages/opencode/src/agent/agent.ts
@@ -82,13 +82,17 @@ function withBugReportPrompt(agent: Info) {
   }
 }
 
-const legacyAgentTargets = {
+export const legacyAgentTargets = {
   build: "ayaz",
   general: "quick-high",
   plan: "niggli",
   explore: "explorer",
 } as const satisfies Record<string, string>
 
+/** Resolves a legacy agent name to its replacement; other names, including inherited keys like "constructor", pass through. */
+export function resolveLegacyAgentTarget(name: string): string {
+  return Object.prototype.hasOwnProperty.call(legacyAgentTargets, name) ? legacyAgentTargets[name as keyof typeof legacyAgentTargets] : name
+}
 function applyAgentOverride(item: Info, value: AgentOverride) {
   const next = {
     ...item,
@@ -294,9 +298,7 @@ export const layer = Layer.effect(
           }),
         ) satisfies Record<string, Info>
 
-        const get = Effect.fnUntraced(function* (agent: string) {
-          return agents[agent] ?? legacy[agent]
-        })
+        const get = (agent: string) => Effect.succeed(agents[agent] ?? legacy[agent])
 
         const list = Effect.fnUntraced(function* () {
           const cfg = yield* config.get()
diff --git a/packages/opencode/src/agent/primitive/ayaz.ts b/packages/opencode/src/agent/primitive/ayaz.ts
@@ -55,8 +55,10 @@ Execution contract:
 
 Task async delegation contract:
 - \`task_async\` is Ayaz's delegation surface for helper lanes; use it decisively when the work crosses a real lane boundary or when bounded helper work materially improves correctness, coverage, or throughput
+- Use the modern async names literally: the tool is \`task_async\` and the repository-discovery subagent is \`explorer\`; do not fall back to legacy \`task\` or \`explore\` names when you mean async helper delegation
 - Do not use \`task_async\` for vague, overlapping, or avoidable delegation; every started task must have a concrete question, bounded ownership, and clear evidence expectations
-- Use \`explorer\` when local discovery is deep enough that Ayaz would otherwise bloat context, or when location, wiring, ownership, or target narrowing is still unclear after the first narrow local pass
+- Use \`explorer\` when local discovery is deep enough that Ayaz would otherwise bloat context, when location, wiring, ownership, or target narrowing is still unclear after the first narrow local pass, or when the user explicitly asks for exhaustive investigation or multi-thread evidence gathering
+- If you are about to do three or more non-overlapping discovery passes yourself, stop and launch focused \`task_async\` \`explorer\` work instead of hoarding all discovery inside Ayaz
 - Use \`librarian\` for web research, official docs, release behavior, package semantics, framework details, or upstream implementation questions that depend on external sources
 - Do not continue broad external research inside Ayaz when \`librarian\` is the correct lane; hand the research off, then reconcile the returned evidence with repository reality and the current implementation target
 - Use \`architect\` when a meaningful design, boundary, ownership, contract, storage, migration, or rollout decision remains open after normal repository and external evidence gathering
diff --git a/packages/opencode/src/team/memory.ts b/packages/opencode/src/team/memory.ts
@@ -793,7 +793,9 @@ export namespace TeamMemory {
           throw new Error("atlas_private must be curated by atlas")
         }
         if (featureArea(area)) {
-          if (input.actor !== "atlas") throw new Error("feature_memory must be curated by atlas")
+          if (!["atlas", "ayaz"].includes(input.actor)) {
+            throw new Error("feature_memory must be curated by atlas or ayaz")
+          }
           if (!scope) throw new Error("scope is required for feature_memory")
           if ((input.class ?? Class.enum.knowledge) !== Class.enum.knowledge) {
             throw new Error("feature_memory must use class=knowledge")
diff --git a/packages/opencode/src/tool/shared/truncate.ts b/packages/opencode/src/tool/shared/truncate.ts
@@ -109,7 +109,7 @@ export namespace Truncate {
         yield* fs.writeFileString(file, text).pipe(Effect.orDie)
 
         const hint = hasTaskTool(agent)
-          ? `The tool call succeeded but the output was truncated. Full output saved to: ${file}\nUse task_async to have the explore agent process this file with inspect/search. Do NOT read the full file yourself - delegate to save context.`
+          ? `The tool call succeeded but the output was truncated. Full output saved to: ${file}\nUse task_async to have the explorer subagent process this file with inspect/search. Do NOT read the full file yourself - delegate to save context.`
           : `The tool call succeeded but the output was truncated. Full output saved to: ${file}\nUse Search to scan the full content or Inspect with offset/limit-style reads to view specific sections.`
 
         return {
diff --git a/packages/opencode/src/tool/task/task_async.ts b/packages/opencode/src/tool/task/task_async.ts
@@ -3,7 +3,7 @@ import z from "zod"
 import { Session } from "../../session"
 import { SessionID, MessageID } from "../../session/schema"
 import { MessageV2 } from "../../session/message-v2"
-import { Agent } from "../../agent/agent"
+import { Agent, resolveLegacyAgentTarget } from "../../agent/agent"
 import { SessionPrompt } from "../../session/prompt"
 import { SessionStatus } from "../../session/status"
 import { Config } from "../../config/config"
@@ -865,10 +865,14 @@ export const TaskAsyncTool = Tool.defineEffect(
     ) {
       const cfg = yield* config.get()
       const action = params.action
+      const requestedSubagent = action === "start" ? params.subagent_type! : undefined
+      const aliasTarget = requestedSubagent ? resolveLegacyAgentTarget(requestedSubagent) : undefined
+      const aliasAgent = aliasTarget && aliasTarget !== requestedSubagent ? yield* agent.get(aliasTarget) : undefined
+      const startSubagent = aliasAgent && aliasAgent.mode === "subagent" && !aliasAgent.hidden ? aliasTarget : requestedSubagent
 
       if (!ctx.extra?.bypassAgentCheck) {
-        const patterns = action === "start" ? [params.subagent_type!, action] : [action]
-        const always = action === "start" ? [params.subagent_type!, action] : [action]
+        const patterns = action === "start" ? [startSubagent!, action] : [action]
+        const always = action === "start" ? [startSubagent!, action] : [action]
         yield* Effect.promise(() =>
           ctx.ask({
             permission: id,
@@ -877,7 +881,7 @@ export const TaskAsyncTool = Tool.defineEffect(
             metadata: {
               action,
               description: action === "start" ? params.description : undefined,
-              subagent_type: action === "start" ? params.subagent_type : undefined,
+              subagent_type: action === "start" ? startSubagent : undefined,
               task_id: action === "start" ? undefined : params.task_id,
             },
           }),
@@ -1219,10 +1223,10 @@ export const TaskAsyncTool = Tool.defineEffect(
         }
       }
 
-      const txt = block.get(params.subagent_type!)
+      const txt = block.get(params.subagent_type!) ?? (startSubagent ? block.get(startSubagent) : undefined)
       if (txt) return yield* Effect.fail(new Error(txt))
 
-      const next = yield* agent.get(params.subagent_type!)
+      const next = yield* agent.get(startSubagent!)
       if (!next) {
         return yield* Effect.fail(new Error(`Unknown agent type: ${params.subagent_type} is not a valid agent type`))
       }
diff --git a/packages/opencode/src/tool/team-tools/memory.ts b/packages/opencode/src/tool/team-tools/memory.ts
@@ -15,7 +15,7 @@ Memory is not a scratchpad. Do not use it for live coordination, ephemeral execu
 
 Areas:
 - \`project_rules\`: prompt-safe reusable project rules
-- \`feature_memory\`: Atlas-curated validated feature-purpose and behavior notes keyed by stable \`scope\`
+- \`feature_memory\`: validated feature-purpose and behavior notes keyed by stable \`scope\`
 - \`atlas_private\`: ATLAS-only private memory that must not leak to subagents
 - \`lessons\`: shared durable knowledge, evidence, measurements, and artifacts
 
@@ -43,7 +43,7 @@ Strict rules:
 4. \`promote\` only promotes an active \`lessons\` entry into \`project_rules\`. It is not a general cross-area copy tool.
 5. \`remove\` and \`bulk_remove\` require \`reason\`. Unless \`sensitive=true\`, archive first.
 6. \`bulk_remove\` is all-or-nothing at the tool layer: if any requested \`id\` is missing or not permitted, nothing is removed.
-7. \`feature_memory\` writes are Atlas-only and require \`scope\`, \`class=knowledge\`, and \`kind=package_behavior\` or \`kind=runtime_behavior\`.
+7. \`feature_memory\` writes require \`scope\`, \`class=knowledge\`, and \`kind=package_behavior\` or \`runtime_behavior\`.
 8. Security \`finding\`/\`remediation\`/\`verification\` entries and performance \`baseline\`/\`measurement\`/\`optimization\` entries require structured \`payload\` evidence.
 9. Archive superseded entries; remove only junk, duplicates, or sensitive cleanup.`
 
@@ -581,7 +581,7 @@ function out(title: string, output: string, metadata: Meta) {
 
 function note(area: TeamMemory.Area) {
   if (area === "project_rules") return "prompt-safe reusable project rules"
-  if (area === "feature_memory") return "Atlas-curated validated feature-purpose and behavior notes"
+  if (area === "feature_memory") return "validated feature-purpose and behavior notes"
   if (area === "atlas_private") return "ATLAS-only private memory"
   return "shared durable knowledge, evidence, measurements, and artifacts"
 }
diff --git a/packages/opencode/test/team/memory-write.test.ts b/packages/opencode/test/team/memory-write.test.ts
@@ -45,4 +45,44 @@ describe("team memory write", () => {
       },
     })
   })
+
+  test("ayaz can rewrite feature memory by stable scope", async () => {
+    await using dir = await tmpdir({ git: true })
+
+    await Instance.provide({
+      directory: dir.path,
+      fn: async () => {
+        const first = await TeamMemory.write({
+          area: TeamMemory.TeamMemory.Area.enum.feature_memory,
+          kind: TeamMemory.TeamMemory.Kind.enum.package_behavior,
+          domain: TeamMemory.TeamMemory.Domain.enum.general,
+          title: "Memory tool behavior",
+          content: "first feature note",
+          scope: "tool.memory",
+          tags: ["feature", "memory"],
+          sessionID: SessionID.make("ses_test_memory"),
+          actor: "ayaz",
+        })
+
+        const second = await TeamMemory.write({
+          area: TeamMemory.TeamMemory.Area.enum.feature_memory,
+          kind: TeamMemory.TeamMemory.Kind.enum.package_behavior,
+          domain: TeamMemory.TeamMemory.Domain.enum.general,
+          title: "Memory tool behavior",
+          content: "second feature note",
+          scope: "tool.memory",
+          tags: ["feature", "memory"],
+          sessionID: SessionID.make("ses_test_memory"),
+          actor: "ayaz",
+        })
+
+        expect(second.id).toBe(first.id)
+        expect(second.content).toBe("second feature note")
+        expect(second.scope).toBe("tool.memory")
+        expect(
+          (await TeamMemory.list({ area: TeamMemory.TeamMemory.Area.enum.feature_memory, scope: "tool.memory" })).length,
+        ).toBe(1)
+      },
+    })
+  })
 })
diff --git a/packages/opencode/test/tool/ayaz-regressions.test.ts b/packages/opencode/test/tool/ayaz-regressions.test.ts
@@ -11,4 +11,11 @@ describe("ayaz source regressions", () => {
     expect(text).toContain('git_read: "allow"')
   })
 
+  test("keeps explicit async explorer delegation guidance in the prompt", async () => {
+    const text = await Bun.file(new URL("../../src/agent/primitive/ayaz.ts", import.meta.url)).text()
+    expect(text).toContain("the tool is \\\`task_async\\\` and the repository-discovery subagent is \\\`explorer\\\`")
+    expect(text).toContain("user explicitly asks for exhaustive investigation or multi-thread evidence gathering")
+    expect(text).toContain("launch focused \\\`task_async\\\` \\\`explorer\\\` work")
+  })
+
 })
diff --git a/packages/opencode/test/tool/task-async.test.ts b/packages/opencode/test/tool/task-async.test.ts
@@ -0,0 +1,112 @@
+import { afterEach, describe, expect } from "bun:test"
+import { Effect, Exit, Layer } from "effect"
+import { Agent } from "../../src/agent/agent"
+import { Config } from "../../src/config"
+import * as CrossSpawnSpawner from "../../src/effect/cross-spawn-spawner"
+import { Instance } from "../../src/project/instance"
+import { Permission } from "../../src/permission"
+import { ModelID, ProviderID } from "../../src/provider/schema"
+import { Session } from "../../src/session"
+import { MessageV2 } from "../../src/session/message-v2"
+import { MessageID } from "../../src/session/schema"
+import { ToolRegistry, Truncate } from "../../src/tool"
+import { provideTmpdirInstance } from "../fixture/fixture"
+import { testEffect } from "../lib/effect"
+
+afterEach(async () => {
+  await Instance.disposeAll()
+})
+
+const ref = {
+  providerID: ProviderID.make("test"),
+  modelID: ModelID.make("test-model"),
+}
+
+const it = testEffect(
+  Layer.mergeAll(
+    Agent.defaultLayer,
+    Config.defaultLayer,
+    CrossSpawnSpawner.defaultLayer,
+    Session.defaultLayer,
+    Truncate.defaultLayer,
+    ToolRegistry.defaultLayer,
+  ),
+)
+
+const seed = Effect.fn("TaskAsyncToolTest.seed")(function* (title = "Pinned") {
+  const session = yield* Session.Service
+  const chat = yield* session.create({ title })
+  const user = yield* session.updateMessage({
+    id: MessageID.ascending(),
+    role: "user",
+    sessionID: chat.id,
+    agent: "ayaz",
+    model: ref,
+    time: { created: Date.now() },
+  })
+  const assistant: MessageV2.Assistant = {
+    id: MessageID.ascending(),
+    role: "assistant",
+    parentID: user.id,
+    sessionID: chat.id,
+    mode: "ayaz",
+    agent: "ayaz",
+    cost: 0,
+    path: { cwd: "/tmp", root: "/tmp" },
+    tokens: { input: 0, output: 0, reasoning: 0, cache: { read: 0, write: 0 } },
+    modelID: ref.modelID,
+    providerID: ref.providerID,
+    time: { created: Date.now() },
+  }
+  yield* session.updateMessage(assistant)
+  return { chat, assistant }
+})
+
+describe("tool.task_async", () => {
+  it.live("canonicalizes the legacy explore alias before permission checks", () =>
+    provideTmpdirInstance(() =>
+      Effect.gen(function* () {
+        const registry = yield* ToolRegistry.Service
+        const tool = (yield* registry.all()).find((item) => item.id === "task_async")
+        expect(tool).toBeDefined()
+        if (!tool) throw new Error("task_async tool not found")
+
+        const { chat, assistant } = yield* seed()
+        const asks: Array<Omit<Permission.Request, "id" | "sessionID" | "tool">> = []
+        const exit = yield* Effect.exit(
+          tool.execute(
+            {
+              action: "start",
+              description: "inspect alias",
+              prompt: "look into the target",
+              subagent_type: "explore",
+            },
+            {
+              sessionID: chat.id,
+              messageID: assistant.id,
+              agent: "ayaz",
+              abort: new AbortController().signal,
+              messages: [],
+              metadata: () => Effect.void,
+              ask: (input) =>
+                Effect.sync(() => {
+                  asks.push(input)
+                  throw new Error("stop after ask")
+                }),
+            },
+          ),
+        )
+
+        expect(Exit.isFailure(exit)).toBe(true)
+        expect(asks).toHaveLength(1)
+        expect(asks[0]?.patterns).toEqual(["explorer", "start"])
+        expect(asks[0]?.always).toEqual(["explorer", "start"])
+        expect(asks[0]?.metadata).toMatchObject({
+          action: "start",
+          description: "inspect alias",
+          subagent_type: "explorer",
+        })
+      }),
+    ),
+  )
+})
diff --git a/packages/opencode/test/tool/truncation.test.ts b/packages/opencode/test/tool/truncation.test.ts
@@ -181,6 +181,9 @@ describe("Truncate", () => {
 
       expect(result.truncated).toBe(true)
       expect(result.content).toContain("The tool call succeeded but the output was truncated")
+      expect(result.content).toContain("task_async")
+      expect(result.content).toContain("explorer subagent")
+      expect(result.content).not.toContain("explore agent")
       if (!result.truncated) throw new Error("expected truncated")
       expect(result.outputPath).toContain("tool_")
     })
diff --git a/packages/ui-team/src/team-components/translation-state.test.ts b/packages/ui-team/src/team-components/translation-state.test.ts
@@ -0,0 +1,36 @@
+import { describe, expect, test } from "bun:test"
+import { resolvedTranslationStatus, translationBannerStats } from "./translation-state"
+
+describe("translation-state", () => {
+  test("active status overrides stale translated flags", () => {
+    expect(resolvedTranslationStatus({ is_translate: true, translate_status: "waiting" })).toBe("waiting")
+    expect(resolvedTranslationStatus({ is_translate: true, translate_status: "started" })).toBe("started")
+    expect(resolvedTranslationStatus({ is_translate: true, translate_status: "idle" })).toBe("finished")
+  })
+
+  test("banner counts only current-pass finished items", () => {
+    expect(
+      translationBannerStats({
+        translating: true,
+        items: [
+          { is_translate: true, translate_status: "waiting" },
+          { is_translate: true, translate_status: "waiting" },
+          { is_translate: true, translate_status: "waiting" },
+          { is_translate: true, translate_status: "waiting" },
+        ],
+      }),
+    ).toEqual({ total: 4, done: 0 })
+
+    expect(
+      translationBannerStats({
+        translating: true,
+        items: [
+          { is_translate: true, translate_status: "finished" },
+          { is_translate: true, translate_status: "started" },
+          { is_translate: true, translate_status: "waiting" },
+          { is_translate: true, translate_status: "idle" },
+        ],
+      }),
+    ).toEqual({ total: 4, done: 2 })
+  })
+})
diff --git a/packages/ui-team/src/team-components/translation-state.tsx b/packages/ui-team/src/team-components/translation-state.tsx