sunilp · sunilp · Mar 20, 2026 · Mar 20, 2026 · Mar 20, 2026 · Mar 20, 2026
diff --git a/docs/plans/2026-03-20-jam-agent-engine.md b/docs/plans/2026-03-20-jam-agent-engine.md
diff --git a/docs/specs/2026-03-20-jam-agent-engine-design.md b/docs/specs/2026-03-20-jam-agent-engine-design.md
diff --git a/src/agent/config.test.ts b/src/agent/config.test.ts
@@ -0,0 +1,56 @@
+import { describe, it, expect } from 'vitest';
+import { JamConfigSchema } from '../config/schema.js';
+
+/**
+ * Parses a config holding only the given `agent` section (an empty config
+ * when omitted) and returns the resolved `agent` settings.
+ */
+const parseAgent = (agent?: unknown) =>
+  JamConfigSchema.parse(agent === undefined ? {} : { agent }).agent;
+
+// Exercises the `agent` section of JamConfigSchema: defaults, overrides, rejected values.
+describe('agent config schema', () => {
+  it('provides defaults when agent section is omitted', () => {
+    const agent = parseAgent();
+    expect(agent).toBeDefined();
+    expect(agent.maxWorkers).toBe(3);
+    expect(agent.defaultMode).toBe('supervised');
+    expect(agent.maxRoundsPerWorker).toBe(20);
+    expect(agent.sandbox.filesystem).toBe('workspace-only');
+    expect(agent.sandbox.network).toBe('allowed');
+    expect(agent.sandbox.timeout).toBe(60000);
+    expect(agent.permissions.safe).toEqual([]);
+    expect(agent.permissions.dangerous).toEqual([]);
+  });
+
+  it('validates custom agent config', () => {
+    const custom = {
+      maxWorkers: 5,
+      defaultMode: 'auto',
+      permissions: { safe: ['npm test'], dangerous: ['docker rm'] },
+      sandbox: { filesystem: 'unrestricted', network: 'blocked', timeout: 30000 },
+    };
+    const agent = parseAgent(custom);
+    expect(agent.maxWorkers).toBe(5);
+    expect(agent.defaultMode).toBe('auto');
+    expect(agent.permissions.safe).toEqual(['npm test']);
+    expect(agent.sandbox.network).toBe('blocked');
+  });
+
+  it('rejects invalid mode', () => {
+    const parseUnknownMode = () => parseAgent({ defaultMode: 'yolo' });
+    expect(parseUnknownMode).toThrow();
+  });
+
+  it('rejects maxWorkers < 1', () => {
+    const parseZeroWorkers = () => parseAgent({ maxWorkers: 0 });
+    expect(parseZeroWorkers).toThrow();
+  });
+
+  it('rejects maxRoundsPerWorker out of bounds', () => {
+    // Both probes must be rejected: one at 0, one at 51.
+    for (const maxRoundsPerWorker of [0, 51]) {
+      expect(() => parseAgent({ maxRoundsPerWorker })).toThrow();
+    }
+  });
+});
diff --git a/src/agent/errors.test.ts b/src/agent/errors.test.ts
@@ -0,0 +1,28 @@
+import { describe, it, expect } from 'vitest';
+import { JamError } from '../utils/errors.js';
+
+// Error codes checked below; each must be accepted by JamError and yield a hint.
+const AGENT_CODES = [
+  'AGENT_PLAN_FAILED',
+  'AGENT_PLAN_CYCLE',
+  'AGENT_WORKER_TIMEOUT',
+  'AGENT_WORKER_CANCELLED',
+  'AGENT_FILE_LOCK_CONFLICT',
+  'AGENT_FILE_LOCK_TIMEOUT',
+  'AGENT_BUDGET_EXCEEDED',
+  'AGENT_SANDBOX_UNAVAILABLE',
+  'AGENT_RATE_LIMITED',
+  'AGENT_MERGE_CONFLICT',
+] as const;
+
+describe('agent error codes', () => {
+  // Registers one test case per code.
+  AGENT_CODES.forEach((code) => {
+    it(`creates JamError with code ${code}`, () => {
+      const message = `test ${code}`;
+      const err = new JamError(message, code);
+      expect(err.code).toBe(code);
+      expect(err.hint).toBeDefined();
+    });
+  });
+});
diff --git a/src/agent/file-lock.test.ts b/src/agent/file-lock.test.ts
@@ -0,0 +1,79 @@
+import { describe, it, expect } from 'vitest';
+import { FileLockManager } from './file-lock.js';
+
+// Unit tests for FileLockManager: plan-time ownership, on-demand requests,
+// release, and wait-graph deadlock detection.
+describe('FileLockManager', () => {
+  it('assigns ownership from plan', () => {
+    const mgr = new FileLockManager();
+    mgr.assignOwnership('w1', [
+      { path: 'src/a.ts', mode: 'create' },
+      { path: 'src/b.ts', mode: 'modify' },
+    ]);
+    expect(mgr.getOwner('src/a.ts')).toBe('w1');
+    expect(mgr.getOwner('src/b.ts')).toBe('w1');
+  });
+
+  it('grants request for unowned file', () => {
+    const mgr = new FileLockManager();
+    const resp = mgr.requestFile({ workerId: 'w1', path: 'src/c.ts', reason: 'need it' });
+    expect(resp.granted).toBe(true);
+    expect(mgr.getOwner('src/c.ts')).toBe('w1');
+  });
+
+  it('grants request for own file', () => {
+    const mgr = new FileLockManager();
+    mgr.assignOwnership('w1', [{ path: 'src/a.ts', mode: 'modify' }]);
+    const resp = mgr.requestFile({ workerId: 'w1', path: 'src/a.ts', reason: 'already mine' });
+    expect(resp.granted).toBe(true);
+  });
+
+  it('denies request for file owned by another worker', () => {
+    const mgr = new FileLockManager();
+    mgr.assignOwnership('w1', [{ path: 'src/a.ts', mode: 'modify' }]);
+    const resp = mgr.requestFile({ workerId: 'w2', path: 'src/a.ts', reason: 'need it' });
+    expect(resp.granted).toBe(false);
+    expect(resp.waitForWorker).toBe('w1');
+  });
+
+  it('releases all locks for a worker', () => {
+    const mgr = new FileLockManager();
+    mgr.assignOwnership('w1', [
+      { path: 'src/a.ts', mode: 'create' },
+      { path: 'src/b.ts', mode: 'modify' },
+    ]);
+    mgr.releaseAll('w1');
+    expect(mgr.getOwner('src/a.ts')).toBeUndefined();
+    expect(mgr.getOwner('src/b.ts')).toBeUndefined();
+  });
+
+  it('grants file after previous owner releases', () => {
+    const mgr = new FileLockManager();
+    mgr.assignOwnership('w1', [{ path: 'src/a.ts', mode: 'modify' }]);
+    mgr.releaseAll('w1');
+    const resp = mgr.requestFile({ workerId: 'w2', path: 'src/a.ts', reason: 'now free' });
+    expect(resp.granted).toBe(true);
+  });
+
+  it('detects deadlock (cycle in wait graph)', () => {
+    const mgr = new FileLockManager();
+    mgr.assignOwnership('w1', [{ path: 'src/a.ts', mode: 'modify' }]);
+    mgr.assignOwnership('w2', [{ path: 'src/b.ts', mode: 'modify' }]);
+    // w1 waits for w2's file
+    mgr.requestFile({ workerId: 'w1', path: 'src/b.ts', reason: 'need b' });
+    // No cycle from w1's side: w2 is not waiting on anyone
+    expect(mgr.detectDeadlock('w1', 'w2')).toBe(false);
+    // Now w2 wants w1's file — this would create a deadlock
+    expect(mgr.detectDeadlock('w2', 'w1')).toBe(true);
+    const resp = mgr.requestFile({ workerId: 'w2', path: 'src/a.ts', reason: 'need a' });
+    expect(resp.granted).toBe(false);
+    expect(resp.waitForWorker).toBe('w1');
+    // The refused wait must not be recorded, so w2 still waits on nobody
+    expect(mgr.detectDeadlock('w1', 'w2')).toBe(false);
+  });
+
+  it('returns undefined owner for unknown path', () => {
+    const mgr = new FileLockManager();
+    expect(mgr.getOwner('nonexistent')).toBeUndefined();
+  });
+});
diff --git a/src/agent/file-lock.ts b/src/agent/file-lock.ts
@@ -0,0 +1,129 @@
+import type { FileOwnership, FileLockRequest, FileLockResponse } from './types.js';
+
+/**
+ * In-memory registry of which worker owns which file, plus a wait graph used
+ * to detect circular waits between workers.
+ *
+ * A file has at most one owner, and a worker has at most one recorded wait
+ * edge.
+ */
+export class FileLockManager {
+  // Maps file path → owner worker ID
+  private owners = new Map<string, string>();
+  // Maps worker ID → set of file paths they own
+  private workerFiles = new Map<string, Set<string>>();
+  // Wait graph: worker ID → worker ID they're waiting on (for deadlock detection)
+  private waitGraph = new Map<string, string>();
+
+  /**
+   * Bulk assign ownership from plan.
+   *
+   * A path already held by a different worker is transferred to `workerId`.
+   *
+   * @param workerId - Worker that becomes the owner of every listed file.
+   * @param files - Files to assign; only `path` is read here.
+   */
+  assignOwnership(workerId: string, files: FileOwnership[]): void {
+    for (const file of files) {
+      this.setOwner(file.path, workerId);
+    }
+  }
+
+  /**
+   * Request access to a file not originally owned.
+   *
+   * @param request - Requesting worker and the path it wants.
+   * @returns `{ granted: true }` when the file is unowned or already owned by
+   *   the requester; otherwise `{ granted: false, waitForWorker }` naming the
+   *   current owner. A denial that would close a wait cycle has the same shape
+   *   but records no wait edge; `detectDeadlock` tells the two cases apart.
+   */
+  requestFile(request: FileLockRequest): FileLockResponse {
+    const owner = this.owners.get(request.path);
+
+    // No owner → grant immediately
+    if (!owner) {
+      this.setOwner(request.path, request.workerId);
+      return { granted: true };
+    }
+
+    // Already own it
+    if (owner === request.workerId) return { granted: true };
+
+    // Waiting here would close a cycle: deny without recording the wait and
+    // leave it to the caller (orchestrator) to handle the deadlock.
+    if (this.detectDeadlock(request.workerId, owner)) {
+      return { granted: false, waitForWorker: owner };
+    }
+
+    // Not available — caller must wait
+    this.waitGraph.set(request.workerId, owner);
+    return { granted: false, waitForWorker: owner };
+  }
+
+  /**
+   * Release all locks held by a worker and drop every wait edge that involves it.
+   *
+   * @param workerId - Worker whose files and wait edges are cleared.
+   */
+  releaseAll(workerId: string): void {
+    const files = this.workerFiles.get(workerId);
+    if (files) {
+      for (const path of files) {
+        this.owners.delete(path);
+      }
+      this.workerFiles.delete(workerId);
+    }
+    this.waitGraph.delete(workerId);
+    // The worker now owns nothing, so nobody can still be blocked on it. A
+    // leftover edge would make later detectDeadlock calls report false cycles.
+    for (const [waiter, target] of this.waitGraph) {
+      if (target === workerId) this.waitGraph.delete(waiter);
+    }
+  }
+
+  /** Get owner of a file */
+  getOwner(path: string): string | undefined {
+    return this.owners.get(path);
+  }
+
+  /**
+   * Check if waiting would create a deadlock (cycle in wait graph).
+   *
+   * @param requestingWorker - Worker that wants to wait.
+   * @param waitForWorker - Worker it would wait on.
+   * @returns `true` when following wait edges from `waitForWorker` reaches
+   *   `requestingWorker`.
+   */
+  detectDeadlock(requestingWorker: string, waitForWorker: string): boolean {
+    // Each worker has at most one outgoing edge, so the walk is a single chain.
+    // `visited` stops the walk if the chain loops without reaching the requester.
+    const visited = new Set<string>();
+    let current: string | undefined = waitForWorker;
+    while (current) {
+      if (current === requestingWorker) return true;
+      if (visited.has(current)) break;
+      visited.add(current);
+      current = this.waitGraph.get(current);
+    }
+    return false;
+  }
+
+  /**
+   * Makes `workerId` the sole owner of `path`, detaching the path from any
+   * previous owner so that owner's later releaseAll cannot free this lock.
+   */
+  private setOwner(path: string, workerId: string): void {
+    const previous = this.owners.get(path);
+    if (previous !== undefined && previous !== workerId) {
+      this.workerFiles.get(previous)?.delete(path);
+    }
+    this.owners.set(path, workerId);
+    let held = this.workerFiles.get(workerId);
+    if (!held) {
+      held = new Set();
+      this.workerFiles.set(workerId, held);
+    }
+    held.add(path);
+  }
+}
diff --git a/src/agent/index.ts b/src/agent/index.ts
@@ -0,0 +1,16 @@
+export * from './types.js';
+export { PermissionClassifier, classifyCommand, isHardBlocked, ApprovalTracker } from './permissions.js';
+export { detectSandboxStrategy, buildSandboxArgs, executeSandboxed } from './sandbox.js';
+export type { SandboxStrategy } from './sandbox.js';
+export { getTextContent, hasImages, flattenForProvider, loadImage } from './multimodal.js';
+export { FileLockManager } from './file-lock.js';
+export { ProviderPool } from './provider-pool.js';
+export type { ProviderLease } from './provider-pool.js';
+export { buildWorkspaceProfile, formatProfileForPrompt, computeProfileHash, loadCachedProfile } from './workspace-intel.js';
+export { generateTaskPlan, estimateTokenCost } from './planner.js';
+export { executeWorker } from './worker.js';
+export type { WorkerDeps } from './worker.js';
+export { Orchestrator } from './orchestrator.js';
+export type { OrchestratorDeps, OrchestratorOptions, OrchestratorResult, ProgressEvent } from './orchestrator.js';
+export { ProgressReporter, createProgressReporter } from './progress.js';
+export type { OutputMode } from './progress.js';
diff --git a/src/agent/integration.test.ts b/src/agent/integration.test.ts
@@ -0,0 +1,142 @@
+import { describe, it, expect, vi, beforeEach, type Mock } from 'vitest';
+import { Orchestrator } from './orchestrator.js';
+import type { ProgressEvent } from './orchestrator.js';
+import type { ProviderAdapter } from '../providers/base.js';
+import type { Subtask, SubtaskContext } from './types.js';
+
+// Mock workspace-intel to avoid filesystem dependency: buildWorkspaceProfile resolves to this fixed profile
+vi.mock('./workspace-intel.js', () => ({
+  buildWorkspaceProfile: vi.fn().mockResolvedValue({
+    language: 'typescript', monorepo: false, srcLayout: 'src/',
+    entryPoints: ['src/index.ts'], codeStyle: {
+      indent: 'spaces', indentSize: 2, quotes: 'single',
+      semicolons: true, trailingCommas: true, namingConvention: 'camelCase',
+    },
+    fileNaming: 'kebab-case.ts', exportStyle: 'barrel', importStyle: 'relative',
+    errorHandling: 'JamError', logging: 'Logger', configPattern: 'cosmiconfig',
+    testFramework: 'vitest', testLocation: 'co-located', testNaming: '*.test.ts',
+    testStyle: 'describe/it', testCommand: 'npm test', commitConvention: 'conventional',
+    branchPattern: 'feat/*', packageManager: 'npm', typeChecker: 'tsc',
+  }),
+  formatProfileForPrompt: vi.fn().mockReturnValue('TypeScript project'),
+}));
+
+// Mock planner to return a fixed 2-subtask plan with dependency (subtask '2' is listed as depending on '1')
+vi.mock('./planner.js', () => ({
+  generateTaskPlan: vi.fn().mockResolvedValue({
+    goal: 'Add greeting feature',
+    subtasks: [
+      {
+        id: '1', description: 'Create greeting module',
+        files: [{ path: 'src/greeting.ts', mode: 'create' }],
+        estimatedRounds: 5,
+      },
+      {
+        id: '2', description: 'Add tests for greeting',
+        files: [{ path: 'src/greeting.test.ts', mode: 'create' }],
+        estimatedRounds: 5,
+        validationCommand: 'npm test',
+      },
+    ],
+    dependencyGraph: new Map([['1', []], ['2', ['1']]]),
+  }),
+  estimateTokenCost: vi.fn().mockReturnValue(10000),
+}));
+
+// Mock worker to simulate completing subtasks: each call resolves as 'completed' with 300 total tokens
+let _workerCallCount = 0; // bumped by the worker mock and reset in beforeEach; no assertion in this file reads it
+vi.mock('./worker.js', () => ({
+  executeWorker: vi.fn().mockImplementation((subtask: Subtask) => {
+    _workerCallCount++;
+    return Promise.resolve({
+      subtaskId: subtask.id,
+      status: 'completed',
+      filesChanged: [{ path: subtask.files[0]?.path ?? 'unknown', action: 'created', diff: '' }],
+      summary: `Completed subtask ${subtask.id}: ${subtask.description}`,
+      tokensUsed: { promptTokens: 200, completionTokens: 100, totalTokens: 300 },
+    });
+  }),
+}));
+
+const mockAdapter = { // stub provider whose methods are bare vi.fn() mocks, force-cast to ProviderAdapter
+  info: { name: 'mock', supportsStreaming: true, supportsTools: true },
+  validateCredentials: vi.fn(),
+  streamCompletion: vi.fn(),
+  listModels: vi.fn(),
+  chatWithTools: vi.fn(),
+} as unknown as ProviderAdapter;
+
+describe('Agent Engine Integration', () => { // runs the real Orchestrator against the mocked planner, worker and workspace-intel modules
+  beforeEach(() => {
+    _workerCallCount = 0;
+    vi.clearAllMocks(); // reset recorded mock calls so per-test call counts start from zero
+  });
+
+  it('orchestrates a 2-subtask plan end-to-end', async () => {
+    const orch = new Orchestrator({
+      adapter: mockAdapter,
+      workspaceRoot: '/workspace',
+      toolSchemas: [],
+      executeTool: vi.fn().mockResolvedValue('ok'),
+    });
+
+    const events: ProgressEvent[] = [];
+    const result = await orch.execute('add a greeting feature', {
+      mode: 'auto',
+      maxWorkers: 2,
+      onProgress: (e) => events.push(e),
+    });
+
+    // Plan was generated
+    expect(result.plan.goal).toBe('Add greeting feature');
+    expect(result.plan.subtasks).toHaveLength(2);
+
+    // Both subtasks completed
+    expect(result.results).toHaveLength(2);
+    expect(result.results.every(r => r.status === 'completed')).toBe(true);
+
+    // Dependency order: subtask 1 before subtask 2
+    expect(result.results[0].subtaskId).toBe('1');
+    expect(result.results[1].subtaskId).toBe('2');
+
+    // Files tracked
+    expect(result.filesChanged).toContain('src/greeting.ts');
+    expect(result.filesChanged).toContain('src/greeting.test.ts');
+
+    // Token usage aggregated
+    expect(result.totalTokens.totalTokens).toBe(600); // 300 * 2
+
+    // Progress events fired
+    expect(events.some(e => e.type === 'plan-ready')).toBe(true);
+    expect(events.filter(e => e.type === 'worker-started')).toHaveLength(2);
+    expect(events.filter(e => e.type === 'worker-completed')).toHaveLength(2);
+    expect(events.some(e => e.type === 'all-done')).toBe(true);
+
+    // Summary contains both subtask results
+    expect(result.summary).toContain('1:');
+    expect(result.summary).toContain('2:');
+  });
+
+  it('worker receives prior context from dependency', async () => {
+    const { executeWorker } = await import('./worker.js');
+
+    const orch = new Orchestrator({
+      adapter: mockAdapter,
+      workspaceRoot: '/workspace',
+      toolSchemas: [],
+      executeTool: vi.fn().mockResolvedValue('ok'),
+    });
+
+    await orch.execute('test', { mode: 'auto', maxWorkers: 1 }); // no onProgress here; only the worker mock's recorded calls are inspected
+
+    // Second worker call should have received context from first
+    const mockFn = executeWorker as unknown as Mock;
+    const calls = mockFn.mock.calls as Array<[Subtask, SubtaskContext, ...unknown[]]>;
+    expect(calls).toHaveLength(2);
+
+    // Second call's context should reference subtask 1's output
+    const secondCallContext = calls[1][1]; // context parameter
+    expect(secondCallContext.priorSummary).toContain('subtask 1');
+    expect(secondCallContext.filesAvailable).toContain('src/greeting.ts');
+  });
+});