Compare commits
36 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
| 6d0034dc88 | |||
| a153291643 | |||
| a0619f9740 | |||
| f478088797 | |||
| e2b749d42e | |||
| c747d3e8be | |||
| d9927558d5 | |||
| 895d9f95a1 | |||
| 30352a3603 | |||
| d58fd0bdde | |||
| 0799cfc644 | |||
| 70ee21856d | |||
| b7d02ee4a4 | |||
| 8e50049ba5 | |||
| da528cc493 | |||
| a8b50f5109 | |||
| 4b7d16247d | |||
| 70f9f720e6 | |||
| 93967feb68 | |||
| 07e5e70c9b | |||
| f7fff95cbe | |||
| d3186cde06 | |||
| d6ba76e660 | |||
| 04c4489e70 | |||
| 5fb285cf46 | |||
| 2306493a77 | |||
| a416413c7d | |||
| e8c6c5c917 | |||
| 4de1f65c10 | |||
| 6902c37ced | |||
| bbabd2dc0a | |||
| 99df4fe4e2 | |||
| 8527df24b3 | |||
| 4a58aa1657 | |||
| e31afe3b59 | |||
| ab6af144b7 |
@@ -0,0 +1,19 @@
|
||||
name: CI
|
||||
on:
|
||||
push:
|
||||
branches: [main, "phase/*", "milestone/*"]
|
||||
pull_request:
|
||||
branches: [main]
|
||||
jobs:
|
||||
build-and-test:
|
||||
runs-on: ubuntu-latest
|
||||
steps:
|
||||
- uses: actions/checkout@v4
|
||||
- uses: actions/setup-node@v4
|
||||
with:
|
||||
node-version: '20'
|
||||
- run: npm ci
|
||||
- run: npm run typecheck
|
||||
- run: npm run build
|
||||
- run: npm test
|
||||
- run: npm pack --dry-run
|
||||
@@ -0,0 +1,20 @@
|
||||
name: Publish to npm
|
||||
on:
|
||||
push:
|
||||
tags: ['v*']
|
||||
jobs:
|
||||
publish:
|
||||
runs-on: ubuntu-latest
|
||||
steps:
|
||||
- uses: actions/checkout@v4
|
||||
- uses: actions/setup-node@v4
|
||||
with:
|
||||
node-version: '20'
|
||||
registry-url: 'https://registry.npmjs.org'
|
||||
- run: npm ci
|
||||
- run: npm run typecheck
|
||||
- run: npm run build
|
||||
- run: npm test
|
||||
- run: npm publish --access public
|
||||
env:
|
||||
NODE_AUTH_TOKEN: ${{ secrets.NPM_TOKEN }}
|
||||
Executable
+80
@@ -0,0 +1,80 @@
|
||||
#!/bin/bash
|
||||
# CI pre-push hook: enforce versioning and branching rules
|
||||
# Install: git config core.hooksPath .githooks
|
||||
|
||||
zero="0000000000000000000000000000000000000000"
|
||||
|
||||
while read local_ref local_oid remote_ref remote_oid; do
|
||||
if [ "$local_oid" = "$zero" ]; then
|
||||
continue
|
||||
fi
|
||||
|
||||
# Check pushed tags
|
||||
if echo "$local_ref" | grep -qE "^refs/tags/"; then
|
||||
tag_name=$(echo "$local_ref" | sed 's|^refs/tags/||')
|
||||
|
||||
# Validate semver format
|
||||
if echo "$tag_name" | grep -qE "^v[0-9]+\.[0-9]+\.[0-9]+$"; then
|
||||
tag_major=$(echo "$tag_name" | sed 's/v\([0-9]*\)\.[0-9]*\.[0-9]*/\1/')
|
||||
tag_minor=$(echo "$tag_name" | sed 's/v[0-9]*\.\([0-9]*\)\.[0-9]*/\1/')
|
||||
tag_patch=$(echo "$tag_name" | sed 's/v[0-9]*\.[0-9]*\.\([0-9]*\)/\1/')
|
||||
|
||||
# Check for semver ordering violations
|
||||
for existing_tag in $(git tag -l "v${tag_major}.${tag_minor}.*" 2>/dev/null); do
|
||||
if [ "$existing_tag" = "$tag_name" ]; then
|
||||
continue
|
||||
fi
|
||||
existing_patch=$(echo "$existing_tag" | sed 's/v[0-9]*\.[0-9]*\.\([0-9]*\)/\1/')
|
||||
if [ "$existing_patch" -ge "$tag_patch" ] && [ "$tag_patch" -le "$existing_patch" ]; then
|
||||
echo "ERROR: Tag $tag_name is not greater than existing tag $existing_tag"
|
||||
echo " Milestone tags must be the NEXT version (e.g., v0.6.0 after v0.5.1-5, NOT v0.5.0)"
|
||||
exit 1
|
||||
fi
|
||||
done
|
||||
|
||||
# Check for milestone-tags-below-phase-tags
|
||||
# If this is a .0 tag (milestone), verify no .N tags exist with higher patch
|
||||
if [ "$tag_patch" = "0" ]; then
|
||||
for existing_tag in $(git tag -l "v${tag_major}.${tag_minor}.*" 2>/dev/null); do
|
||||
existing_patch=$(echo "$existing_tag" | sed 's/v[0-9]*\.[0-9]*\.\([0-9]*\)/\1/')
|
||||
if [ "$existing_patch" -gt 0 ] && [ "$existing_patch" -gt "$tag_patch" ]; then
|
||||
echo "ERROR: Milestone tag $tag_name is below existing phase tags (e.g., $existing_tag)"
|
||||
echo " Feature milestone completion must be tagged as v${tag_major}.$(($tag_minor + 1)).0, not v${tag_major}.${tag_minor}.0"
|
||||
exit 1
|
||||
fi
|
||||
done
|
||||
fi
|
||||
fi
|
||||
fi
|
||||
|
||||
# Check branch merges: reject direct-to-main pushes if milestone branch exists
|
||||
if echo "$local_ref" | grep -qE "^refs/heads/main$"; then
|
||||
milestone_branches=$(git branch -r 2>/dev/null | grep 'milestone/v' | grep -v ':$' || true)
|
||||
if [ -n "$milestone_branches" ]; then
|
||||
# Allow if this is a merge commit from a milestone branch
|
||||
merge_parents=$(git cat-file -p "$local_oid" 2>/dev/null | grep "^parent" | wc -l)
|
||||
if [ "$merge_parents" -lt 2 ]; then
|
||||
# Not a merge commit — check if there are active milestone branches
|
||||
active_milestones=""
|
||||
for mb in $milestone_branches; do
|
||||
clean_name=$(echo "$mb" | sed 's|^[^/]*/||' | tr -d ' ')
|
||||
merged=$(git branch -r --merged origin/main 2>/dev/null | grep "$clean_name" || true)
|
||||
if [ -z "$merged" ]; then
|
||||
active_milestones="$active_milestones $clean_name"
|
||||
fi
|
||||
done
|
||||
if [ -n "$active_milestones" ]; then
|
||||
echo "WARNING: Pushing directly to main while active milestone branches exist:"
|
||||
for ms in $active_milestones; do
|
||||
echo " - $ms"
|
||||
done
|
||||
echo " Phase branches should merge into the milestone branch first."
|
||||
# Warning only — not blocking. The code-level enforcement in git-branch.ts
|
||||
# is the hard gate; this hook is a safety net.
|
||||
fi
|
||||
fi
|
||||
fi
|
||||
fi
|
||||
done
|
||||
|
||||
exit 0
|
||||
@@ -1,4 +1,4 @@
|
||||
# AGENTS.md — CI Project Guidelines
|
||||
# AGENTS.md — CIAgent Project Guidelines
|
||||
|
||||
## Build & Run Commands
|
||||
|
||||
@@ -9,38 +9,40 @@
|
||||
|
||||
## Project Overview
|
||||
|
||||
CI (Continuous Intelligence) is a fully autonomous AI-driven software engineering harness. It receives a specification, resolves ambiguities through a single Clarify phase, then executes the full pipeline (research → plan → execute → verify) autonomously, escalating only when it cannot safely proceed alone.
|
||||
CIAgent (Continuous Intelligence) is a fully autonomous AI-driven software engineering harness. It receives a specification, resolves ambiguities through a single Clarify phase, then executes the full pipeline (research → plan → execute → verify) autonomously, escalating only when it cannot safely proceed alone.
|
||||
|
||||
## Architecture
|
||||
|
||||
```
|
||||
src/
|
||||
agents/ # 18 agent implementations (persona loaders delegating to backends)
|
||||
agents/ # 19 agent implementations (persona loaders delegating to backends)
|
||||
backends/ # Intelligence backend layer
|
||||
types.ts # IntelligenceBackend, BackendRequest, BackendResult, BackendConfigSection
|
||||
tool-registry.ts # CI-owned tool implementations (readFile, writeFile, editFile, runBash, glob, grep)
|
||||
ollama-base.ts # Abstract base for Ollama backends (shared tool loop, prompt construction)
|
||||
tool-registry.ts # CIAgent-owned tool implementations (readFile, writeFile, editFile, runBash, glob, grep)
|
||||
llm-base.ts # Abstract base for LLM backends (shared tool loop, prompt construction)
|
||||
ollama-local.ts # OllamaLocalBackend (localhost:11434)
|
||||
ollama-cloud.ts # OllamaCloudBackend (remote endpoint, auth, rate limiting)
|
||||
openai.ts # OpenAIBackend (OpenAI API, gpt-4o)
|
||||
anthropic.ts # AnthropicBackend (Anthropic API, Claude)
|
||||
opencode.ts # OpencodeBackend (shells out to opencode --non-interactive)
|
||||
index.ts # Backend registry + auto-detection
|
||||
cli/ # Commander.js CLI (commands.ts, index.ts)
|
||||
core/ # Core engine components
|
||||
artifacts.ts # Legacy .ci/ artifact management (retained for backward compat)
|
||||
audit.ts # Legacy audit trail in .ci/audit/ (retained for backward compat)
|
||||
ci-files.ts # .ci/ long-lived reference file management (PROJECT.md, ROADMAP.md, etc.)
|
||||
core/ # Core engine components
|
||||
artifacts.ts # Legacy .ciagent/ artifact management (retained for backward compat)
|
||||
audit.ts # Git-native audit trail — reads decisions/escalations from git log
|
||||
ciagent-files.ts # .ciagent/ long-lived reference file management (PROJECT.md, ROADMAP.md, etc.)
|
||||
clarify.ts # Clarify phase: question generation, default acceptance
|
||||
commit-builder.ts # Structured commit message generation (---ci--- YAML blocks)
|
||||
commit-parser.ts # ---ci--- YAML block extraction and parsing
|
||||
config.ts # .ci/config.json load/save/init
|
||||
config.ts # .ciagent/config.json load/save/init
|
||||
decision-engine.ts # Bounded rationality: commits decisions as git artifacts
|
||||
error-recovery.ts # Retry, plan revision, rollback logic
|
||||
escalation.ts # Escalation protocol: commits escalations as git artifacts
|
||||
git-branch.ts # Branch lifecycle: phase/NN-slug, milestone/vX.X-slug
|
||||
git-context.ts # Project state reconstruction from git log + branches
|
||||
types/ # Type definitions
|
||||
commit-meta.ts # CiMetadata, CommitDecision, CommitEscalation, ParsedCiCommit
|
||||
config.ts # CIConfig, AutonomyLevel, ModelProfile, DEFAULT_CI_CONFIG (includes backend)
|
||||
commit-meta.ts # CIAgentMetadata, CommitDecision, CommitEscalation, ParsedCIAgentCommit
|
||||
config.ts # CIAgentConfig, AutonomyLevel, ModelProfile, DEFAULT_CIAGENT_CONFIG (includes backend)
|
||||
decisions.ts # Decision, ConfidenceLevel, DecisionCategory
|
||||
escalation.ts # Escalation, EscalationType, EscalationResolution
|
||||
clarify.ts # ClarifyQuestion, ClarifyResult
|
||||
@@ -53,7 +55,7 @@ src/
|
||||
security.ts # Layer 3: regex-based threat pattern scanning (no STRIDE analysis yet)
|
||||
quality.ts # Layer 4: regex-based code quality checks (no multi-persona review yet)
|
||||
index.ts # Public API exports
|
||||
version.ts # VERSION = "0.4.0"
|
||||
version.ts # VERSION = "0.9.0"
|
||||
templates/ # Template files (config.json, DECISIONS.md, specification.md)
|
||||
```
|
||||
|
||||
@@ -62,9 +64,9 @@ templates/ # Template files (config.json, DECISIONS.md, specification.md
|
||||
- **Autonomy levels**: `full` (no HITL after clarify), `supervised` (escalate on gates + verification failures), `guided` (escalate on every decision gate)
|
||||
- **Decision confidence thresholds**: High (>0.85) auto-decide and log; Medium (0.60–0.85) auto-decide with assumption logging; Low (<0.60) escalate to human
|
||||
- **Escalation timeout**: Default 5 minutes, then auto-proceeds with recommended option. Set to `0` to require human, `-1` to always auto-proceed
|
||||
- **18 agents** purpose-built for CI, all configured for autonomous operation. OrchestratorAgent is CI-specific
|
||||
- **Git-native context**: The git log IS the project memory. Agent's first impulse to gather context is `git log` + `git branch`, not file reads. Dynamic state (decisions, escalations, lessons, compounding) lives in `---ci---` YAML blocks in commit messages. `.ci/` holds only long-lived reference docs (PROJECT.md, ARCHITECTURE.md, ROADMAP.md, REQUIREMENTS.md, config.json).
|
||||
- **Artifact compatibility**: CI no longer writes `.planning/` schema. Dynamic state is derived from git history. `.ci/` files follow a CI-native schema.
|
||||
- **19 agents** purpose-built for CIAgent, all configured for autonomous operation. OrchestratorAgent is CIAgent-specific
|
||||
- **Git-native context**: The git log IS the project memory. Agent's first impulse to gather context is `git log` + `git branch`, not file reads. Dynamic state (decisions, escalations, lessons, compounding) lives in `---ci---` YAML blocks in commit messages. `.ciagent/` holds only long-lived reference docs (PROJECT.md, ARCHITECTURE.md, ROADMAP.md, REQUIREMENTS.md, config.json).
|
||||
- **Artifact compatibility**: CIAgent no longer writes `.planning/` schema. `.ciagent/` files follow a CIAgent-native schema.
|
||||
|
||||
## Code Conventions
|
||||
|
||||
@@ -73,7 +75,7 @@ templates/ # Template files (config.json, DECISIONS.md, specification.md
|
||||
- **Agent pattern**: All agents extend `BaseAgent` with `name` (AgentName), `description`, `workflow`, and `execute(context: AgentContext): Promise<AgentResult>`. Agents delegate to `context.backend` when available, fail honestly when not.
|
||||
- **No runtime validation library**: Uses plain TypeScript types, not Zod schemas (Zod is a dependency but types are hand-defined)
|
||||
- **File I/O**: Use `src/utils/file.ts` helpers (`writeFile`, `readFile`, `ensureDir`, `readJSON`, `writeJSON`) instead of raw `fs` calls in agent/business logic
|
||||
- **Config**: `CIConfig` type and `DEFAULT_CI_CONFIG` in `src/types/config.ts` — always merge partial configs with defaults
|
||||
- **Config**: `CIAgentConfig` type and `DEFAULT_CIAGENT_CONFIG` in `src/types/config.ts` — always merge partial configs with defaults
|
||||
- **Error handling**: Agents return `{ success: false, error: string }` rather than throwing
|
||||
- **No comments in code**: Follow existing pattern — agent files have no comments
|
||||
- **Naming**: `camelCase` for functions/variables, `PascalCase` for classes/types/interfaces, `kebab-case` for file names
|
||||
@@ -82,29 +84,30 @@ templates/ # Template files (config.json, DECISIONS.md, specification.md
|
||||
## Pipeline Flow
|
||||
|
||||
```
|
||||
SPECIFY → CLARIFY → RESEARCH → PLAN → EXECUTE → VERIFY → COMPLETE
|
||||
SPECIFY → CLARIFY → RESEARCH → IDEATE → PLAN → EXECUTE → TEST → VERIFY → COMPLETE
|
||||
```
|
||||
|
||||
Each stage is executed by `OrchestratorAgent.executeStage()`. The orchestrator delegates intelligent stages (research, plan, execute, verify) to specialized agents via `context.backend` when available, falling back to mechanical execution when no backend is configured. Mechanical stages (specify, clarify, complete) are always handled by the orchestrator directly.
|
||||
Each stage is executed by `OrchestratorAgent.executeStage()`. The orchestrator delegates intelligent stages (research, plan, execute, test, verify) to specialized agents via `context.backend` when available, falling back to mechanical execution when no backend is configured. Mechanical stages (specify, clarify, complete) are always handled by the orchestrator directly.
|
||||
|
||||
## Intelligence Backend Architecture
|
||||
|
||||
```
|
||||
IntelligenceBackend (unified interface)
|
||||
├── LLMBackend (CI runs tool loop, provides tools, constructs prompts)
|
||||
├── LLMBackend (CIAgent runs tool loop, provides tools, constructs prompts)
|
||||
│ ├── OllamaLocalBackend (localhost:11434, no auth)
|
||||
│ ├── OllamaCloudBackend (remote endpoint, API key, rate limits)
|
||||
│ └── (future: OpenAI, Anthropic, Gemini, etc.)
|
||||
└── AgentBackend (agent runs own tool loop, CI sends request)
|
||||
│ ├── OpenAIBackend (OpenAI API, gpt-4o, API key auth)
|
||||
│ └── AnthropicBackend (Anthropic API, Claude, API key auth)
|
||||
└── AgentBackend (agent runs own tool loop, CIAgent sends request)
|
||||
├── OpencodeBackend (opencode --non-interactive)
|
||||
└── (future: Codex, Claude Code, Hermes, etc.)
|
||||
```
|
||||
|
||||
- **LLM backends**: CI constructs system prompts from persona.md + workflow.md, defines tool schemas, runs the tool-call loop via `ToolRegistry`, and parses structured JSON output
|
||||
- **Agent backends**: CI serializes `BackendRequest`, invokes the agent, and parses JSON `BackendResult` from stdout
|
||||
- **Auto-detection** (provider: "auto"): tries opencode → ollama-local → ollama-cloud → fails with instructions
|
||||
- **Per-command override**: `ci run --backend ollama-local` forces a specific backend
|
||||
- **Config**: `backend` section in `.ci/config.json` with provider, fallback, agent_backends, llm_backends
|
||||
- **LLM backends**: CIAgent constructs system prompts from persona.md + workflow.md, defines tool schemas, runs the tool-call loop via `ToolRegistry`, and parses structured JSON output
|
||||
- **Agent backends**: CIAgent serializes `BackendRequest`, invokes the agent, and parses JSON `BackendResult` from stdout
|
||||
- **Auto-detection** (provider: "auto"): tries opencode → openai → ollama-local → ollama-cloud → anthropic → fails with instructions
|
||||
- **Per-command override**: `ciagent run --backend ollama-local` forces a specific backend (options: opencode, openai, anthropic, ollama-local, ollama-cloud)
|
||||
- **Config**: `backend` section in `.ciagent/config.json` with provider, fallback, agent_backends, llm_backends
|
||||
|
||||
## Agent Modification Rules (from PRD)
|
||||
|
||||
@@ -122,26 +125,26 @@ IntelligenceBackend (unified interface)
|
||||
## Verification Layers
|
||||
|
||||
1. **Structural**: Files exist, imports wired, no stubs/TODOs
|
||||
2. **Behavioral**: Check test infrastructure and requirement traceability (static analysis — test generation not yet implemented)
|
||||
3. **Security**: Regex-based threat pattern scanning with auto-disposition (STRIDE analysis not yet implemented)
|
||||
4. **Code Quality**: Regex-based code quality checks (multi-persona review not yet implemented)
|
||||
2. **Behavioral**: Test execution and requirement traceability — runs test framework, parses results, reports pass/fail per suite
|
||||
3. **Security**: Full STRIDE threat pattern scanning with CWE mapping and confidence-based auto-disposition
|
||||
4. **Code Quality**: 3-persona code review (security, performance, maintainability) with P0/P1/P2 findings
|
||||
|
||||
## Testing
|
||||
|
||||
- Test framework: Jest with ts-jest
|
||||
- Test file pattern: `**/*.test.ts` in `src/`
|
||||
- Run: `npm run test`
|
||||
- 25 test suites, 218 tests covering types, core, git-native, verification, and utility modules
|
||||
- 58 test suites, 561 tests covering types, core, git-native, verification, agent, backends, ideation, multi-project, and utility modules
|
||||
- Tests use temp directories (os.mkdtempSync) and clean up after each test
|
||||
- Module resolution in jest uses moduleNameMapper to strip `.js` extensions
|
||||
|
||||
## Important Files
|
||||
|
||||
- `.ci/config.json` — Project-level CI configuration (autonomy, parallelization, verification, security, git)
|
||||
- `.ci/PROJECT.md` — Vision, core value, requirements, constraints, key decisions table
|
||||
- `.ci/ARCHITECTURE.md` — System architecture, component boundaries, data flow
|
||||
- `.ci/ROADMAP.md` — Phase breakdown, milestone mapping, success criteria, progress table
|
||||
- `.ci/REQUIREMENTS.md` — v1/v2 requirements with REQ-IDs and traceability matrix
|
||||
- `.ciagent/config.json` — Project-level CIAgent configuration (autonomy, parallelization, verification, security, git)
|
||||
- `.ciagent/PROJECT.md` — Vision, core value, requirements, constraints, key decisions table
|
||||
- `.ciagent/ARCHITECTURE.md` — System architecture, component boundaries, data flow
|
||||
- `.ciagent/ROADMAP.md` — Phase breakdown, milestone mapping, success criteria, progress table
|
||||
- `.ciagent/REQUIREMENTS.md` — v1/v2 requirements with REQ-IDs and traceability matrix
|
||||
- Git log — Primary project memory: decisions, escalations, lessons, compounding, verification results
|
||||
- Branch structure — `phase/NN-slug` (active/complete) and `milestone/vX.X-slug` branches
|
||||
|
||||
@@ -191,16 +194,18 @@ IntelligenceBackend (unified interface)
|
||||
|
||||
## Current State
|
||||
|
||||
- **v0.4.0**: Backends module (OllamaLocal, OllamaCloud, Opencode), learnship references removed, verification layers migrated from .planning/ to .ci/
|
||||
- **New modules**: commit-parser (`---ci---` YAML block extraction/parsing), commit-builder (structured commit message generation), git-context (project state reconstruction from git log + branches), git-branch (phase/milestone branch lifecycle), ci-files (`.ci/` long-lived reference file management)
|
||||
- **Commit schema**: Every CI-generated commit contains a `---ci---` YAML block with phase, milestone, status, decisions, escalations, requirements, lessons, and compound metadata
|
||||
- **v0.10.0**: Ideate & Multi-Project — 3-tier ideation engine, `ciagent ideate` command, multi-project execution, `---ci--- project:` blocks, E2E tests
|
||||
- **v0.9.0**: Integration & hardening — OpenAI and Anthropic backends, all 19 agents with intrinsic mechanical logic, E2E v0.9 integration tests, parallel agent execution
|
||||
- **v0.8.0**: 11 newly-fleshed agents with mechanical methods, OpenAI/Anthropic config types, Gitea CI workflows
|
||||
- **New in v0.10**: IdeationEngine with mechanical/backend-enriched/cross-project tiers, `ciagent ideate` command with --category/--affected/--spec/--external/--cross-project/--project/--output flags, `IDEATE` pipeline stage between RESEARCH and PLAN, multi-project support with `active_projects` config and `--project all` flag, `---ci--- project: <slug>` commit blocks, `max_concurrent_projects` parallelization config
|
||||
- **New backends (v0.9)**: OpenAIBackend (gpt-4o, API key auth, OpenAI-Organization header), AnthropicBackend (Claude, API key auth, anthropic-version header, tool use translation)
|
||||
- **Config expansion (v0.10)**: `ideation` section in config with categories, thresholds, external signals, cross-project, chaos; `active_projects` array; `max_concurrent_projects` in parallelization
|
||||
- **Auto-detection order**: opencode → openai → ollama-local → ollama-cloud → anthropic
|
||||
- **All agents mechanical**: Every non-orchestrator agent (18/19) produces meaningful output without a backend — no "requires intelligence backend" stub errors
|
||||
- **Integration tests**: E2E v0.10 tests verify ideation CLI (mechanical tier), multi-project execution, all-agents-mechanical, parallel execution
|
||||
- **Pipeline stages**: SPECIFY → CLARIFY → RESEARCH → **IDEATE** → PLAN → EXECUTE → TEST → VERIFY → COMPLETE
|
||||
- **Commit schema**: Every CIAgent-generated commit contains a `---ci---` YAML block with phase, milestone, status, decisions, escalations, requirements, lessons, compound, and **project** metadata
|
||||
- **Branch strategy**: `phase/NN-slug` and `milestone/vX.X-slug` branches encode project structure; merged = complete, active = in progress
|
||||
- **Core engine rewrites**: DecisionEngine generates commit messages (not audit JSON), EscalationProtocol commits escalations as git artifacts, OrchestratorAgent uses git log as first impulse
|
||||
- **Removed**: `.ci/audit/` directory (audit trail is git log), `.planning/` directory (dynamic state derived from git history)
|
||||
- **`.ci/` contents**: `config.json`, `PROJECT.md`, `ARCHITECTURE.md`, `ROADMAP.md`, `REQUIREMENTS.md` — long-lived reference docs updated with discipline
|
||||
- **Reconstruction test**: An agent with only commit message access can reconstruct project state (phase, decisions, requirements coverage, lessons, escalations)
|
||||
- **Verification layers**: All 4 layers implemented — structural, behavioral, security (STRIDE), quality
|
||||
- **CLI**: All 11 commands wired up (`init`, `run`, `quick`, `debug`, `verify`, `review`, `status`, `audit`, `clarify`, `rollback`, `ship`)
|
||||
- **Agent implementations**: Persona loaders that delegate to active backend. Fail honestly when no backend is available (no more fake success).
|
||||
- **Intelligence backends**: OllamaLocal (LLM, localhost), OllamaCloud (LLM, remote), Opencode (Agent, --non-interactive). Auto-detection: opencode → ollama-local → ollama-cloud.
|
||||
- **Tests**: 27 test suites covering types, config, decision-engine, escalation, clarify, commit-parser, commit-builder, git-context, git-branch, ci-files, all 4 verification layers, file utils, backends, tool-registry
|
||||
- **CLI commands**: `init`, `run`, `quick`, `debug`, `verify`, `review`, `status`, `audit`, `clarify`, `rollback`, `ship`, `ideate`, `projects`
|
||||
- **Intelligence backends**: 5 options — OpenAI (LLM), Anthropic (LLM), OllamaLocal (LLM, localhost), OllamaCloud (LLM, remote), Opencode (Agent, --non-interactive). Auto-detection: opencode → openai → ollama-local → ollama-cloud → anthropic.
|
||||
- **Tests**: 58 test suites, 561 tests covering types, config, decision-engine, escalation, clarify, commit-parser, commit-builder, git-context, git-branch, ciagent-files, ideation, multi-project, all 4 verification layers, file utils, backends (ollama, openai, anthropic, opencode, tool-registry), agents (all 18 non-orchestrator), zod validation, E2E, parallel execution
|
||||
@@ -1,20 +1,34 @@
|
||||
# CI — Continuous Intelligence
|
||||
# CIAgent — Continuous Intelligence
|
||||
|
||||
Fully autonomous, git-native AI-driven software engineering harness.
|
||||
|
||||
## Overview
|
||||
|
||||
CI (Continuous Intelligence) is an autonomous-first software engineering harness that eliminates human-in-the-loop overhead while preserving the rigor of guided development. It receives a specification, resolves ambiguities through a single Clarify phase, then executes the full pipeline — research, plan, execute, verify — autonomously.
|
||||
CIAgent (Continuous Intelligence) is an autonomous-first software engineering harness that eliminates human-in-the-loop overhead while preserving the rigor of guided development. It receives a specification, resolves ambiguities through a single Clarify phase, then executes the full pipeline — research, plan, execute, verify — autonomously.
|
||||
|
||||
**The git log IS the project memory.** Every decision, escalation, lesson learned, and verification result is encoded in commit messages using structured `---ci---` YAML blocks. An agent's first impulse to gather context is `git log`, not file reads. Another agent with access to only commit messages (no code, no diffs) can reconstruct the project state completely.
|
||||
|
||||
## Intelligence Backends
|
||||
|
||||
CIAgent supports 5 intelligence backends. Set the appropriate environment variable and use `--backend` to select:
|
||||
|
||||
| Backend | Setup | Usage |
|
||||
|---------|-------|-------|
|
||||
| **OpenAI** | `export OPENAI_API_KEY=sk-...` | `ciagent run --backend openai` |
|
||||
| **Anthropic** | `export ANTHROPIC_API_KEY=sk-ant-...` | `ciagent run --backend anthropic` |
|
||||
| **Ollama Local** | `ollama serve` (localhost:11434) | `ciagent run --backend ollama-local` |
|
||||
| **Ollama Cloud** | `export OLLAMA_CLOUD_API_KEY=...` | `ciagent run --backend ollama-cloud` |
|
||||
| **Opencode** | `npm i -g opencode` | `ciagent run --backend opencode` |
|
||||
|
||||
Auto-detection (`--backend auto`, the default) tries: opencode → openai → ollama-local → ollama-cloud → anthropic.
|
||||
|
||||
## Installation
|
||||
|
||||
From source (package not yet published to npm):
|
||||
|
||||
```bash
|
||||
git clone https://git.cloudinit.dev/continuous-intelligence/ci.git
|
||||
cd ci
|
||||
cd ciagent
|
||||
npm install
|
||||
npm run build
|
||||
npm link
|
||||
@@ -24,45 +38,72 @@ npm link
|
||||
|
||||
```bash
|
||||
# Initialize from inline specification
|
||||
ci init "Build a REST API for task management"
|
||||
ciagent init "Build a REST API for task management"
|
||||
|
||||
# Initialize from a specification file
|
||||
ci init --spec ./specs/my-project.md
|
||||
ciagent init --spec ./specs/my-project.md
|
||||
|
||||
# Run the full autonomous pipeline
|
||||
ci run --all
|
||||
ciagent run --all
|
||||
|
||||
# Run a specific phase
|
||||
ci run research
|
||||
ci run plan
|
||||
ci run execute
|
||||
ci run verify
|
||||
ciagent run research
|
||||
ciagent run plan
|
||||
ciagent run execute
|
||||
ciagent run verify
|
||||
|
||||
# Run with specific backends
|
||||
ciagent run --all --backend openai
|
||||
ciagent run --all --backend anthropic
|
||||
ciagent run --all --backend ollama-local
|
||||
|
||||
# Execute an ad-hoc task
|
||||
ci quick "Add authentication middleware"
|
||||
ciagent quick "Add authentication middleware"
|
||||
|
||||
# Check project status (reads from git log + branches)
|
||||
ci status
|
||||
ciagent status
|
||||
|
||||
# Discover improvement opportunities
|
||||
ciagent ideate # Mechanical tier (always available)
|
||||
ciagent ideate --category security # Focus on specific categories
|
||||
ciagent ideate --affected # Cascade impact analysis
|
||||
ciagent ideate --spec # Specification completeness analysis
|
||||
ciagent ideate --external # npm audit + dependency staleness
|
||||
ciagent ideate --cross-project # Cross-project pattern mining
|
||||
ciagent ideate --project all # Run across all active projects
|
||||
ciagent ideate --output json # JSON output mode
|
||||
ciagent ideate --output markdown # Markdown output mode
|
||||
|
||||
# Manage multiple projects
|
||||
ciagent projects list # List all registered projects
|
||||
ciagent projects add <slug> <name> # Add a new project
|
||||
ciagent projects set <slug> # Set the active project
|
||||
|
||||
# Run with ideation stage
|
||||
ciagent run --ideate # Insert IDEATE stage between RESEARCH and PLAN
|
||||
|
||||
# Run across all active projects
|
||||
ciagent run --project all # Execute pipeline for each project
|
||||
|
||||
# Review autonomous decisions (extracted from git log ---ci--- blocks)
|
||||
ci audit
|
||||
ci audit --verbose
|
||||
ciagent audit
|
||||
ciagent audit --verbose
|
||||
|
||||
# Debug an issue
|
||||
ci debug "Tests failing on CI"
|
||||
ciagent debug "Tests failing on CI"
|
||||
|
||||
# Rollback a phase
|
||||
ci rollback 1
|
||||
ciagent rollback 1
|
||||
|
||||
# Ship a phase (verify, security, commit, tag)
|
||||
ci ship 1
|
||||
ciagent ship 1
|
||||
```
|
||||
|
||||
## Git-Native Architecture (v0.2.0)
|
||||
## Git-Native Architecture (v0.10.0)
|
||||
|
||||
### The Commit Schema
|
||||
|
||||
Every CI-generated commit contains a `---ci---` YAML block with structured metadata:
|
||||
Every CIAgent-generated commit contains a `---ci---` YAML block with structured metadata:
|
||||
|
||||
```
|
||||
feat(P01-01-02): create user registration endpoint
|
||||
@@ -92,11 +133,11 @@ requirements:
|
||||
|
||||
| Where | What | Why |
|
||||
|-------|------|-----|
|
||||
| `.ci/config.json` | Autonomy, thresholds, git strategy | Controls system behavior before any commits exist |
|
||||
| `.ci/PROJECT.md` | Vision, core value, requirements, constraints, key decisions table | Long-lived strategic reference |
|
||||
| `.ci/ARCHITECTURE.md` | System architecture, component boundaries, data flow | Long-lived technical reference |
|
||||
| `.ci/ROADMAP.md` | Phase breakdown, milestone mapping, success criteria | Long-lived planning reference |
|
||||
| `.ci/REQUIREMENTS.md` | v1/v2 requirements with REQ-IDs and traceability | Long-lived requirements reference |
|
||||
| `.ciagent/config.json` | Autonomy, thresholds, git strategy, ideation, multi-project | Controls system behavior before any commits exist |
|
||||
| `.ciagent/PROJECT.md` | Vision, core value, requirements, constraints, key decisions table | Long-lived strategic reference |
|
||||
| `.ciagent/ARCHITECTURE.md` | System architecture, component boundaries, data flow | Long-lived technical reference |
|
||||
| `.ciagent/ROADMAP.md` | Phase breakdown, milestone mapping, success criteria | Long-lived planning reference |
|
||||
| `.ciagent/REQUIREMENTS.md` | v1/v2 requirements with REQ-IDs and traceability | Long-lived requirements reference |
|
||||
| **Git commit bodies** | Decisions, escalations, lessons, compounds, verification results | Dynamic event stream — the audit trail |
|
||||
| **Git branches** | Phase/milestone status | `phase/NN-slug` and `milestone/vX.X-slug` encode project structure |
|
||||
|
||||
@@ -121,17 +162,17 @@ An agent starting a session gathers context in this order:
|
||||
1. `git log --oneline -20` — recent activity
|
||||
2. `git branch -a` — phase/milestone structure
|
||||
3. `git log -1 --format="%b"` — latest `---ci---` block
|
||||
4. `.ci/config.json` — autonomy + thresholds
|
||||
5. `.ci/PROJECT.md` — vision + constraints (when needed)
|
||||
6. `.ci/ROADMAP.md` — phase plan + success criteria (when needed)
|
||||
7. `.ci/REQUIREMENTS.md` — REQ-IDs + traceability (when planning)
|
||||
8. `.ci/ARCHITECTURE.md` — system structure (when researching)
|
||||
4. `.ciagent/config.json` — autonomy + thresholds
|
||||
5. `.ciagent/PROJECT.md` — vision + constraints (when needed)
|
||||
6. `.ciagent/ROADMAP.md` — phase plan + success criteria (when needed)
|
||||
7. `.ciagent/REQUIREMENTS.md` — REQ-IDs + traceability (when planning)
|
||||
8. `.ciagent/ARCHITECTURE.md` — system structure (when researching)
|
||||
|
||||
Steps 1-3 take <1 second and provide 80% of the context needed.
|
||||
|
||||
### The Reconstruction Test
|
||||
|
||||
An agent with access to **only commit messages** (no code, no diffs, no `.ci/` files) can reconstruct:
|
||||
An agent with access to **only commit messages** (no code, no diffs, no `.ciagent/` files) can reconstruct:
|
||||
|
||||
| Reconstructable | How |
|
||||
|---------------|-----|
|
||||
@@ -148,7 +189,7 @@ An agent with access to **only commit messages** (no code, no diffs, no `.ci/` f
|
||||
|
||||
### Commit Types
|
||||
|
||||
In addition to conventional commit types, CI uses:
|
||||
In addition to conventional commit types, CIAgent uses:
|
||||
|
||||
| Type | When Used |
|
||||
|------|-----------|
|
||||
@@ -168,7 +209,7 @@ In addition to conventional commit types, CI uses:
|
||||
|
||||
## Configuration
|
||||
|
||||
CI uses `.ci/config.json` for project configuration:
|
||||
CIAgent uses `.ciagent/config.json` for project configuration:
|
||||
|
||||
```json
|
||||
{
|
||||
@@ -185,7 +226,8 @@ CI uses `.ci/config.json` for project configuration:
|
||||
"parallelization": {
|
||||
"enabled": true,
|
||||
"max_concurrent_agents": 5,
|
||||
"min_plans_for_parallel": 2
|
||||
"min_plans_for_parallel": 2,
|
||||
"max_concurrent_projects": 3
|
||||
},
|
||||
"verification": {
|
||||
"automated_only": true,
|
||||
@@ -202,6 +244,25 @@ CI uses `.ci/config.json` for project configuration:
|
||||
"branching_strategy": "phase",
|
||||
"auto_commit": true,
|
||||
"auto_push": false
|
||||
},
|
||||
"ideation": {
|
||||
"enabled": true,
|
||||
"categories": ["security", "quality", "architecture", "coverage", "improvement"],
|
||||
"confidence_threshold": 0.6,
|
||||
"max_ideas": 20,
|
||||
"external_signals": {
|
||||
"npm_audit": true,
|
||||
"osv_advisories": true,
|
||||
"dependency_staleness": true
|
||||
},
|
||||
"cross_project": {
|
||||
"enabled": false,
|
||||
"similarity_weight": 0.5
|
||||
},
|
||||
"chaos": {
|
||||
"enabled": true,
|
||||
"scenarios": ["backend_unavailable", "requirement_change", "test_coverage_drop"]
|
||||
}
|
||||
}
|
||||
}
|
||||
```
|
||||
@@ -211,9 +272,9 @@ CI uses `.ci/config.json` for project configuration:
|
||||
### Pipeline
|
||||
|
||||
```
|
||||
SPECIFY → CLARIFY → RESEARCH → PLAN → EXECUTE → VERIFY → COMPLETE
|
||||
↕ ↕ ↕ ↕
|
||||
(questions) (auto-decide) (auto-run) (auto-verify)
|
||||
SPECIFY → CLARIFY → RESEARCH → IDEATE → PLAN → EXECUTE → TEST → VERIFY → COMPLETE
|
||||
↕ ↕ ↕ ↕ ↕ ↕
|
||||
(questions) (auto-decide) (ideas) (auto-run) (auto-test) (auto-verify)
|
||||
```
|
||||
|
||||
### Git-Native Core Modules
|
||||
@@ -224,7 +285,7 @@ SPECIFY → CLARIFY → RESEARCH → PLAN → EXECUTE → VERIFY → COMPLETE
|
||||
| `commit-builder` | Structured commit message generation for all commit types |
|
||||
| `git-context` | Project state reconstruction from `git log` + `git branch` |
|
||||
| `git-branch` | Phase/milestone branch lifecycle management |
|
||||
| `ci-files` | `.ci/` long-lived reference file management with update discipline |
|
||||
| `ciagent-files` | `.ciagent/` long-lived reference file management with update discipline |
|
||||
|
||||
### Decision Engine
|
||||
|
||||
@@ -235,26 +296,85 @@ Every autonomous decision is classified by confidence:
|
||||
|
||||
Decisions are committed to git as `decision` type commits. The audit trail is `git log --grep="decisions:"`.
|
||||
|
||||
### 18 Agents
|
||||
### 19 Agents
|
||||
|
||||
| Agent | Role | CI Modification |
|
||||
| Agent | Role | CIAgent Modification |
|
||||
|-------|------|----------------|
|
||||
| orchestrator | Pipeline controller | Git-first context loading, `---ci---` commit generation |
|
||||
| planner | Plan creation | Never sets `autonomous: false` |
|
||||
| executor | Task execution | Never pauses for checkpoints |
|
||||
| verifier | Output verification | Generates automated tests, not human UAT |
|
||||
| researcher | Domain research | Logs assumptions, never flags for human |
|
||||
| tester | Integration/e2e tests | Detects and runs existing test files, never writes tests |
|
||||
| challenger | Plan stress-testing | Binding verdicts, only escalates <0.60 |
|
||||
| security-auditor | Security audit | Auto-dispositions threats |
|
||||
| security-auditor | Security audit | Auto-dispositions threats (STRIDE + CWE) |
|
||||
| debugger | Bug fixing | Auto-fixes when confidence > threshold |
|
||||
| Others | Various | Retained from Learnship |
|
||||
| code-reviewer | Code review | 3-persona review (security, performance, maintainability) |
|
||||
| doc-writer | Documentation | Auto-updates ROADMAP/REQUIREMENTS/PROJECT.md |
|
||||
| doc-verifier | Doc audit | Cross-checks docs vs. codebase (agent count, version, test count) |
|
||||
| ideation-agent | Improvement ideas | Feeds uncovered requirements and repeated lessons into planning |
|
||||
| roadmapper | Roadmap creation | Groups requirements by phase, generates success criteria |
|
||||
| plan-checker | Plan validation | Checks structure, IDs, must-haves, wave order, requirement coverage |
|
||||
| project-researcher | Ecosystem research | Detects frameworks, APIs, patterns, tooling from package.json |
|
||||
| research-synthesizer | Research merge | Cross-references findings across .ciagent/ documents |
|
||||
| solution-writer | Solution docs | Produces structured solution documents from plan + requirements |
|
||||
| phase-researcher | Phase research | Extracts decisions, lessons, risks from git log for a specific phase |
|
||||
|
||||
### Ideation
|
||||
|
||||
CIAgent includes a built-in ideation engine that discovers improvement opportunities from git-native signals:
|
||||
|
||||
1. **Tier 1 — Mechanical**: Mines git history for uncovered requirements, repeated lessons, low-confidence decisions, escalation patterns, coverage gaps, architecture drift, and verification inversions
|
||||
2. **Tier 2 — Backend-enriched**: When a backend is available, prioritizes mechanical findings and suggests novel improvements
|
||||
3. **Tier 3 — Cross-project**: Mines patterns from other projects in the multi-project registry
|
||||
|
||||
```
|
||||
ciagent ideate # All mechanical tiers
|
||||
ciagent ideate --category security # Security-focused ideas
|
||||
ciagent ideate --affected # Cascade impact from current changes
|
||||
ciagent ideate --spec # Specification completeness analysis
|
||||
ciagent ideate --external # npm audit + OSV advisories
|
||||
ciagent ideate --cross-project # Cross-project pattern mining
|
||||
ciagent ideate --project all # Across all active projects
|
||||
ciagent ideate --output json # Machine-readable output
|
||||
```
|
||||
|
||||
### Multi-Project
|
||||
|
||||
CIAgent supports multi-project workflows with `--project` flags:
|
||||
|
||||
```bash
|
||||
# Initialize multiple projects
|
||||
ciagent projects add task-api "Task API"
|
||||
ciagent projects add auth-svc "Auth Service"
|
||||
|
||||
# Run ideation across all projects
|
||||
ciagent ideate --project all
|
||||
|
||||
# Run pipeline for a specific project
|
||||
ciagent run --project task-api
|
||||
|
||||
# Run pipeline across all projects
|
||||
ciagent run --project all
|
||||
```
|
||||
|
||||
Commit messages include project tracking in `---ci---` blocks:
|
||||
|
||||
```
|
||||
---ci---
|
||||
phase: 5
|
||||
milestone: v0.10
|
||||
project: task-api
|
||||
status: execute
|
||||
---/ci---
|
||||
```
|
||||
|
||||
### Verification Layers
|
||||
|
||||
1. **Structural**: File existence, import/export wiring, no stubs
|
||||
2. **Behavioral**: Generated automated tests for must-haves
|
||||
3. **Security**: STRIDE analysis with auto-disposition
|
||||
4. **Code Quality**: Multi-persona review with P0 auto-fix
|
||||
2. **Behavioral**: Test execution and requirement traceability — runs test framework, parses results, reports pass/fail per suite
|
||||
3. **Security**: STRIDE threat pattern scanning with CWE mapping and confidence-based auto-disposition
|
||||
4. **Code Quality**: 3-persona code review (security, performance, maintainability) with P0/P1/P2 findings
|
||||
|
||||
## Specification Format
|
||||
|
||||
@@ -280,7 +400,7 @@ Build a REST API for task management.
|
||||
|
||||
## Escalation Protocol
|
||||
|
||||
When CI cannot proceed autonomously:
|
||||
When CIAgent cannot proceed autonomously:
|
||||
|
||||
1. **Irreversible Action**: Deploy, delete, merge to protected branch
|
||||
2. **Verification Failure**: Tests pass but functional verification fails
|
||||
@@ -292,16 +412,15 @@ Each escalation is committed as an `escalation` type commit. Resolved escalation
|
||||
|
||||
## Current Limitations
|
||||
|
||||
- **Agent implementations are stubs**: All 18 agents return success immediately. Real LLM-based agent implementations are needed for research, planning, execution, and verification.
|
||||
- **Agent implementations**: All 18 non-orchestrator agents have intrinsic mechanical logic. Full LLM-powered agent behavior requires an intelligence backend (OpenAI, Anthropic, Ollama, or Opencode).
|
||||
- **Package not published to npm**: Install from source only until a publishing pipeline is configured.
|
||||
- **Behavioral/Security/Quality verification layers**: Structural verification is fully implemented; behavioral, security, and quality layers are partially stubbed.
|
||||
|
||||
## Differences from Learnship
|
||||
|
||||
| Dimension | Learnship | CI |
|
||||
| Dimension | Learnship | CIAgent |
|
||||
|-----------|-----------|-----|
|
||||
| Project memory | `.planning/` directory files (legacy) | Git log + `---ci---` commit blocks |
|
||||
| Audit trail | `.ci/audit/*.json` files (legacy) | `git log --grep="decisions:"` |
|
||||
| Audit trail | `.ciagent/audit/*.json` files (legacy) | `git log --grep="decisions:"` |
|
||||
| State management | `STATE.md` + `STATE.md.json` (legacy) | Reconstructed from git on demand |
|
||||
| Phase discovery | Read `.planning/phases/` directory (legacy) | `git branch -a \| grep phase/` |
|
||||
| Human Interactions | 19+/lifecycle | 1-2/lifecycle |
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Stress-tests CI proposals through product and engineering lenses using forcing questions. Binding verdicts — only escalates when confidence < 0.60.
|
||||
description: Stress-tests CIAgent proposals through product and engineering lenses using forcing questions. Binding verdicts — only escalates when confidence < 0.60.
|
||||
color: "#FFA500"
|
||||
tools:
|
||||
read: true
|
||||
@@ -9,28 +9,28 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI challenger. You stress-test proposals through product and engineering lenses using forcing questions that expose weak assumptions.
|
||||
You are a CIAgent challenger. You stress-test proposals through product and engineering lenses using forcing questions that expose weak assumptions.
|
||||
|
||||
CI challengers produce binding verdicts. Only escalate when confidence < 0.60. If confident the proposal is sound, it proceeds. If confident it needs rework, it is sent back.
|
||||
CIAgent challengers produce binding verdicts. Only escalate when confidence < 0.60. If confident the proposal is sound, it proceeds. If confident it needs rework, it is sent back.
|
||||
|
||||
**CRITICAL: Mandatory Initial Read**
|
||||
If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to load every file listed there before performing any other actions.
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before challenging, load context from git first:
|
||||
|
||||
1. Run `git log --max-count=30` for recent decisions and project history
|
||||
2. Use GitContext.getDecisions(currentPhase) for phase decisions
|
||||
3. Read `.ci/PROJECT.md` for project vision and constraints
|
||||
4. Read `.ci/ARCHITECTURE.md` for component boundaries
|
||||
3. Read `.ciagent/PROJECT.md` for project vision and constraints
|
||||
4. Read `.ciagent/ARCHITECTURE.md` for component boundaries
|
||||
5. Use GitContext.getCompounds() for compound learnings
|
||||
</project_context>
|
||||
|
||||
@@ -44,7 +44,7 @@ Read the proposal and all git context. Extract settled decisions that should not
|
||||
|
||||
For assigned lens (product or engineering):
|
||||
1. Select 3-5 forcing questions most relevant to the proposal
|
||||
2. Answer each based on evidence from git history and .ci/ files
|
||||
2. Answer each based on evidence from git history and .ciagent/ files
|
||||
3. Note confidence level for each answer
|
||||
|
||||
### Product Lens Questions
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Reviews CI code changes through a specific persona lens (correctness, testing, security, performance, maintainability, adversarial). Auto-applies P0 fixes. Flags P1+ for post-hoc review.
|
||||
description: Reviews CIAgent code changes through a specific persona lens (correctness, testing, security, performance, maintainability, adversarial). Auto-applies P0 fixes. Flags P1+ for post-hoc review.
|
||||
color: "#FF69B4"
|
||||
tools:
|
||||
read: true
|
||||
@@ -10,20 +10,20 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI code reviewer. You review code changes through a specific persona lens, finding issues by severity and confidence.
|
||||
You are a CIAgent code reviewer. You review code changes through a specific persona lens, finding issues by severity and confidence.
|
||||
|
||||
CI code reviewers auto-apply P0 fixes. P1+ issues are flagged for post-hoc review via `git log --grep="review"`.
|
||||
CIAgent code reviewers auto-apply P0 fixes. P1+ issues are flagged for post-hoc review via `git log --grep="review"`.
|
||||
|
||||
**CRITICAL: Mandatory Initial Read**
|
||||
If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to load every file listed there before performing any other actions.
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before reviewing, load context from git first:
|
||||
@@ -31,7 +31,7 @@ Before reviewing, load context from git first:
|
||||
1. Run `git log --max-count=10` for recent changes
|
||||
2. Run `git diff HEAD~3` to see the changes being reviewed
|
||||
3. Use GitContext.getDecisions() for design decisions that explain choices
|
||||
4. Read `.ci/ARCHITECTURE.md` for component boundaries
|
||||
4. Read `.ciagent/ARCHITECTURE.md` for component boundaries
|
||||
5. Read `./AGENTS.md` for project conventions and coding standards
|
||||
</project_context>
|
||||
|
||||
|
||||
@@ -11,20 +11,20 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI debugger. You investigate bugs using systematic scientific method — forming hypotheses, testing them against the codebase, and finding the exact root cause.
|
||||
You are a CIAgent debugger. You investigate bugs using systematic scientific method — forming hypotheses, testing them against the codebase, and finding the exact root cause.
|
||||
|
||||
CI debuggers auto-diagnose and auto-fix when confidence > 0.60. Only low-confidence root causes are escalated to human.
|
||||
CIAgent debuggers auto-diagnose and auto-fix when confidence > 0.60. Only low-confidence root causes are escalated to human.
|
||||
|
||||
**CRITICAL: Mandatory Initial Read**
|
||||
If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to load every file listed there before performing any other actions.
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before debugging, load context from git first:
|
||||
@@ -33,7 +33,7 @@ Before debugging, load context from git first:
|
||||
2. Run `git diff HEAD~5` to see recent file changes
|
||||
3. Use GitContext.getDecisions() for decisions that may be relevant
|
||||
4. Read `./AGENTS.md` or `./CLAUDE.md` for project conventions
|
||||
5. Read `.ci/ARCHITECTURE.md` for component boundaries
|
||||
5. Read `.ciagent/ARCHITECTURE.md` for component boundaries
|
||||
</project_context>
|
||||
|
||||
<execution_flow>
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Verifies CI documentation matches the live codebase — catches stale docs, missing sections, incorrect references. Uses git diff to detect code/doc drift.
|
||||
description: Verifies CIAgent documentation matches the live codebase — catches stale docs, missing sections, incorrect references. Uses git diff to detect code/doc drift.
|
||||
color: "#F0E68C"
|
||||
tools:
|
||||
read: true
|
||||
@@ -9,7 +9,7 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI doc verifier. You verify that documentation matches the live codebase by catching stale docs, missing sections, and incorrect references.
|
||||
You are a CIAgent doc verifier. You verify that documentation matches the live codebase by catching stale docs, missing sections, and incorrect references.
|
||||
|
||||
You use git diff and codebase analysis to detect drift between documentation and implementation.
|
||||
|
||||
@@ -18,18 +18,18 @@ If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before verifying, load context from git first:
|
||||
|
||||
1. Run `git diff HEAD~10` to see recent code changes
|
||||
2. Run `git log --max-count=20` for recent doc updates
|
||||
3. Read `.ci/PROJECT.md`, `.ci/ARCHITECTURE.md`, `.ci/REQUIREMENTS.md`, `.ci/ROADMAP.md`
|
||||
3. Read `.ciagent/PROJECT.md`, `.ciagent/ARCHITECTURE.md`, `.ciagent/REQUIREMENTS.md`, `.ciagent/ROADMAP.md`
|
||||
4. Read `./AGENTS.md` or `./CLAUDE.md` for project conventions
|
||||
</project_context>
|
||||
|
||||
@@ -37,7 +37,7 @@ Before verifying, load context from git first:
|
||||
|
||||
## Step 1: Load Documentation
|
||||
|
||||
Read all .ci/ documentation files. Read the codebase for actual state.
|
||||
Read all .ciagent/ documentation files. Read the codebase for actual state.
|
||||
|
||||
## Step 2: Cross-Reference
|
||||
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Writes and updates CI project documentation files — grounded in the live codebase, verifies factual claims. Documentation updates are committed with ---ci--- blocks.
|
||||
description: Writes and updates CIAgent project documentation files — grounded in the live codebase, verifies factual claims. Documentation updates are committed with ---ci--- blocks.
|
||||
color: "#90EE90"
|
||||
tools:
|
||||
read: true
|
||||
@@ -11,20 +11,20 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI doc writer. You write and update CI project documentation files, grounded in the live codebase. You verify factual claims against actual code.
|
||||
You are a CIAgent doc writer. You write and update CIAgent project documentation files, grounded in the live codebase. You verify factual claims against actual code.
|
||||
|
||||
Documentation updates are committed with `---ci---` blocks. You update `.ci/` static files (PROJECT.md, ARCHITECTURE.md, ROADMAP.md, REQUIREMENTS.md) with discipline.
|
||||
Documentation updates are committed with `---ci---` blocks. You update `.ciagent/` static files (PROJECT.md, ARCHITECTURE.md, ROADMAP.md, REQUIREMENTS.md) with discipline.
|
||||
|
||||
**CRITICAL: Mandatory Initial Read**
|
||||
If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to load every file listed there before performing any other actions.
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before writing, load context from git first:
|
||||
@@ -32,7 +32,7 @@ Before writing, load context from git first:
|
||||
1. Run `git log --max-count=20` for recent changes that affect docs
|
||||
2. Use GitContext.getDecisions() for decisions to document
|
||||
3. Use GitContext.getRequirementsCoverage() for current coverage
|
||||
4. Read the existing .ci/ file you're updating
|
||||
4. Read the existing .ciagent/ file you're updating
|
||||
5. Read the relevant source code to verify claims
|
||||
</project_context>
|
||||
|
||||
@@ -51,7 +51,7 @@ Before writing any factual claim:
|
||||
|
||||
## Step 3: Write/Update Documentation
|
||||
|
||||
Use CiFiles methods to write .ci/ files:
|
||||
Use CiFiles methods to write .ciagent/ files:
|
||||
- writeProjectMd(project, reason)
|
||||
- writeArchitectureMd(architecture)
|
||||
- writeRoadmapMd(roadmap)
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Executes a single CI plan atomically — one task at a time with per-task commits and ---ci--- blocks. Never pauses for checkpoint. Creates automated verification scripts for traditionally human tasks.
|
||||
description: Executes a single CIAgent plan atomically — one task at a time with per-task commits and ---ci--- blocks. Never pauses for checkpoint. Creates automated verification scripts for traditionally human tasks.
|
||||
color: "#FFFF00"
|
||||
tools:
|
||||
read: true
|
||||
@@ -11,20 +11,20 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI executor. You execute plan tasks atomically — one task at a time, committing after each with `---ci---` blocks.
|
||||
You are a CIAgent executor. You execute plan tasks atomically — one task at a time, committing after each with `---ci---` blocks.
|
||||
|
||||
CI executors NEVER pause for checkpoints. Every task is autonomous. Create automated verification scripts for traditionally human tasks (manual testing, visual inspection, etc.).
|
||||
CIAgent executors NEVER pause for checkpoints. Every task is autonomous. Create automated verification scripts for traditionally human tasks (manual testing, visual inspection, etc.).
|
||||
|
||||
**CRITICAL: Mandatory Initial Read**
|
||||
If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to load every file listed there before performing any other actions.
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before executing, load context from git first:
|
||||
@@ -32,8 +32,8 @@ Before executing, load context from git first:
|
||||
1. Run `git log --max-count=20` for recent project history
|
||||
2. Use GitContext.reconstructState() for current phase, milestone, stage
|
||||
3. Use GitContext.getDecisions(currentPhase) for phase decisions
|
||||
4. Read `.ci/PROJECT.md` for project constraints
|
||||
5. Read `.ci/ARCHITECTURE.md` for component boundaries
|
||||
4. Read `.ciagent/PROJECT.md` for project constraints
|
||||
5. Read `.ciagent/ARCHITECTURE.md` for component boundaries
|
||||
6. Read `./AGENTS.md` or `./CLAUDE.md` for project conventions
|
||||
</project_context>
|
||||
|
||||
@@ -41,7 +41,7 @@ Before executing, load context from git first:
|
||||
|
||||
## Step 1: Load Context
|
||||
|
||||
Read the plan file. Extract wave, files_modified, autonomous (always true in CI), must_haves.
|
||||
Read the plan file. Extract wave, files_modified, autonomous (always true in CIAgent), must_haves.
|
||||
|
||||
Load git context for current state and decisions.
|
||||
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Generates codebase-grounded improvement ideas through a specific thinking frame for CI. Uses git history to understand the codebase evolution.
|
||||
description: Generates codebase-grounded improvement ideas through a specific thinking frame for CIAgent. Uses git history to understand the codebase evolution.
|
||||
color: "#FFD700"
|
||||
tools:
|
||||
read: true
|
||||
@@ -9,7 +9,7 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI ideation agent. You generate codebase-grounded improvement ideas through a specific thinking frame. You use git history to understand the codebase evolution and identify improvement opportunities.
|
||||
You are a CIAgent ideation agent. You generate codebase-grounded improvement ideas through a specific thinking frame. You use git history to understand the codebase evolution and identify improvement opportunities.
|
||||
|
||||
You do not implement changes. You produce ideas with rationale for the orchestrator to evaluate and potentially plan.
|
||||
|
||||
@@ -18,11 +18,11 @@ If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before ideating, load context from git first:
|
||||
@@ -31,15 +31,15 @@ Before ideating, load context from git first:
|
||||
2. Use GitContext.getDecisions() for existing decisions
|
||||
3. Use GitContext.getCompounds() for compound learnings
|
||||
4. Use GitContext.getLessons() for lessons that suggest improvements
|
||||
5. Read `.ci/ARCHITECTURE.md` for component boundaries
|
||||
6. Read `.ci/REQUIREMENTS.md` for incomplete requirements
|
||||
5. Read `.ciagent/ARCHITECTURE.md` for component boundaries
|
||||
6. Read `.ciagent/REQUIREMENTS.md` for incomplete requirements
|
||||
</project_context>
|
||||
|
||||
<execution_flow>
|
||||
|
||||
## Step 1: Load Context
|
||||
|
||||
Read git history and .ci/ files. Understand the codebase's current state and evolution.
|
||||
Read git history and .ciagent/ files. Understand the codebase's current state and evolution.
|
||||
|
||||
## Step 2: Apply Thinking Frame
|
||||
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Orchestrates the full CI pipeline by iterating through pipeline stages, loading context from the git log first, and delegating to specialized agents. The orchestrator is CI-specific — it drives the SPECIFY → CLARIFY → RESEARCH → PLAN → EXECUTE → VERIFY → COMPLETE flow.
|
||||
description: Orchestrates the full CIAgent pipeline by iterating through pipeline stages, loading context from the git log first, and delegating to specialized agents. The orchestrator is CIAgent-specific — it drives the SPECIFY → CLARIFY → RESEARCH → PLAN → EXECUTE → VERIFY → COMPLETE flow.
|
||||
color: "#00BFFF"
|
||||
tools:
|
||||
read: true
|
||||
@@ -11,9 +11,9 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are the CI orchestrator. You drive the full CI pipeline by iterating through pipeline stages, making git-first context loading decisions, and delegating to specialized agents.
|
||||
You are the CIAgent orchestrator. You drive the full CIAgent pipeline by iterating through pipeline stages, making git-first context loading decisions, and delegating to specialized agents.
|
||||
|
||||
CI operates autonomously after the clarify phase. You never pause for human checkpoints unless a decision falls below the confidence threshold or an escalation hook is triggered.
|
||||
CIAgent operates autonomously after the clarify phase. You never pause for human checkpoints unless a decision falls below the confidence threshold or an escalation hook is triggered.
|
||||
|
||||
Your job: Execute stages in order, collect PhaseResult for each, handle errors via ErrorRecovery, and produce a final project outcome.
|
||||
|
||||
@@ -22,11 +22,11 @@ If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before any operation, load project context from git first:
|
||||
@@ -37,9 +37,9 @@ Before any operation, load project context from git first:
|
||||
4. Use GitContext.getEscalations() for any pending escalations
|
||||
5. Use GitContext.getRequirementsCoverage() for covered/partial requirements
|
||||
6. Use GitContext.getLessons() for learned lessons
|
||||
7. Read `.ci/config.json` for autonomy level and parallelization settings
|
||||
8. Read `.ci/PROJECT.md` for project vision and constraints
|
||||
9. Read `.ci/ROADMAP.md` for phase breakdown and success criteria
|
||||
7. Read `.ciagent/config.json` for autonomy level and parallelization settings
|
||||
8. Read `.ciagent/PROJECT.md` for project vision and constraints
|
||||
9. Read `.ciagent/ROADMAP.md` for phase breakdown and success criteria
|
||||
</project_context>
|
||||
|
||||
<execution_flow>
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Researches how to implement a CI phase well — identifies pitfalls, recommends existing solutions. Uses git history and .ci/ files as primary context sources.
|
||||
description: Researches how to implement a CIAgent phase well — identifies pitfalls, recommends existing solutions. Uses git history and .ciagent/ files as primary context sources.
|
||||
color: "#4169E1"
|
||||
tools:
|
||||
read: true
|
||||
@@ -9,20 +9,20 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI phase researcher. You research how to implement a phase well by identifying pitfalls, recommending existing solutions, and documenting findings.
|
||||
You are a CIAgent phase researcher. You research how to implement a phase well by identifying pitfalls, recommending existing solutions, and documenting findings.
|
||||
|
||||
You use git history and .ci/ files as primary context sources. Research is an intermediate work product — conclusions update .ci/ static files, key findings go in the commit body, decisions go in ---ci--- blocks.
|
||||
You use git history and .ciagent/ files as primary context sources. Research is an intermediate work product — conclusions update .ciagent/ static files, key findings go in the commit body, decisions go in ---ci--- blocks.
|
||||
|
||||
**CRITICAL: Mandatory Initial Read**
|
||||
If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to load every file listed there before performing any other actions.
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before researching, load context from git first:
|
||||
@@ -30,16 +30,16 @@ Before researching, load context from git first:
|
||||
1. Run `git log --max-count=50` for full project history
|
||||
2. Use GitContext.getDecisions() for existing decisions
|
||||
3. Use GitContext.getCompounds() for compound learnings
|
||||
4. Read `.ci/PROJECT.md` for project vision
|
||||
5. Read `.ci/REQUIREMENTS.md` for phase requirements
|
||||
6. Read `.ci/ARCHITECTURE.md` for system design
|
||||
4. Read `.ciagent/PROJECT.md` for project vision
|
||||
5. Read `.ciagent/REQUIREMENTS.md` for phase requirements
|
||||
6. Read `.ciagent/ARCHITECTURE.md` for system design
|
||||
</project_context>
|
||||
|
||||
<execution_flow>
|
||||
|
||||
## Step 1: Load Context
|
||||
|
||||
Read git history and .ci/ files. Understand the phase goal and requirements.
|
||||
Read git history and .ciagent/ files. Understand the phase goal and requirements.
|
||||
|
||||
## Step 2: Research
|
||||
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Verifies CI PLAN.md files for a phase — checks goal coverage, requirement IDs, task completeness, wave correctness, and vertical slice integrity. Uses git context for validation.
|
||||
description: Verifies CIAgent PLAN.md files for a phase — checks goal coverage, requirement IDs, task completeness, wave correctness, and vertical slice integrity. Uses git context for validation.
|
||||
color: "#32CD32"
|
||||
tools:
|
||||
read: true
|
||||
@@ -9,7 +9,7 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI plan checker. You verify PLAN.md files for a phase by checking goal coverage, requirement IDs, task completeness, wave correctness, and vertical slice integrity.
|
||||
You are a CIAgent plan checker. You verify PLAN.md files for a phase by checking goal coverage, requirement IDs, task completeness, wave correctness, and vertical slice integrity.
|
||||
|
||||
You use git context to validate that plans align with existing decisions and don't contradict locked choices.
|
||||
|
||||
@@ -18,20 +18,20 @@ If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before checking, load context from git first:
|
||||
|
||||
1. Run `git log --max-count=20` for recent decisions affecting this phase
|
||||
2. Use GitContext.getDecisions() for locked decisions
|
||||
3. Read `.ci/ROADMAP.md` for phase goal and success criteria
|
||||
4. Read `.ci/REQUIREMENTS.md` for requirement IDs
|
||||
5. Read `.ci/ARCHITECTURE.md` for component boundaries
|
||||
3. Read `.ciagent/ROADMAP.md` for phase goal and success criteria
|
||||
4. Read `.ciagent/REQUIREMENTS.md` for requirement IDs
|
||||
5. Read `.ciagent/ARCHITECTURE.md` for component boundaries
|
||||
</project_context>
|
||||
|
||||
<execution_flow>
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Creates executable plans for a CI phase — decomposes goals into vertical slice tasks with wave-ordered dependency analysis. Never sets autonomous: false. Plans are precise prompts, not documents that become prompts.
|
||||
description: Creates executable plans for a CIAgent phase — decomposes goals into vertical slice tasks with wave-ordered dependency analysis. Never sets autonomous: false. Plans are precise prompts, not documents that become prompts.
|
||||
color: "#00FF00"
|
||||
tools:
|
||||
read: true
|
||||
@@ -10,29 +10,29 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI planner. You create executable plans for a phase by decomposing goals into atomic, independently verifiable tasks with wave-based dependency ordering.
|
||||
You are a CIAgent planner. You create executable plans for a phase by decomposing goals into atomic, independently verifiable tasks with wave-based dependency ordering.
|
||||
|
||||
CI plans NEVER have `autonomous: false`. Every task is autonomous by default. Decompose into verifiable subtasks that an executor can implement without interpretation.
|
||||
CIAgent plans NEVER have `autonomous: false`. Every task is autonomous by default. Decompose into verifiable subtasks that an executor can implement without interpretation.
|
||||
|
||||
**CRITICAL: Mandatory Initial Read**
|
||||
If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to load every file listed there before performing any other actions.
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before planning, load context from git first:
|
||||
|
||||
1. Run `git log --max-count=50` to see recent decisions and project history
|
||||
2. Read `.ci/PROJECT.md` for project vision and constraints
|
||||
3. Read `.ci/REQUIREMENTS.md` for requirement IDs assigned to this phase
|
||||
4. Read `.ci/ROADMAP.md` for phase goal and success criteria
|
||||
5. Read `.ci/ARCHITECTURE.md` for component boundaries and build order
|
||||
2. Read `.ciagent/PROJECT.md` for project vision and constraints
|
||||
3. Read `.ciagent/REQUIREMENTS.md` for requirement IDs assigned to this phase
|
||||
4. Read `.ciagent/ROADMAP.md` for phase goal and success criteria
|
||||
5. Read `.ciagent/ARCHITECTURE.md` for component boundaries and build order
|
||||
6. Use GitContext.getDecisions(currentPhase) for phase-specific decisions
|
||||
7. Use GitContext.getLessons() for lessons that affect planning
|
||||
8. Use GitContext.getCompounds() for compound learnings from past phases
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Researches the domain ecosystem for a new CI project. Produces reference files that inform roadmap creation. Uses web search and codebase analysis.
|
||||
description: Researches the domain ecosystem for a new CIAgent project. Produces reference files that inform roadmap creation. Uses web search and codebase analysis.
|
||||
color: "#4169E1"
|
||||
tools:
|
||||
read: true
|
||||
@@ -9,7 +9,7 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI project researcher. You research the domain ecosystem for a new CI project, producing reference files that inform roadmap creation.
|
||||
You are a CIAgent project researcher. You research the domain ecosystem for a new CI project, producing reference files that inform roadmap creation.
|
||||
|
||||
You investigate the technology stack, available features, system architecture patterns, and common pitfalls for the domain.
|
||||
|
||||
@@ -18,18 +18,18 @@ If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before researching, load context from git first:
|
||||
|
||||
1. Run `git log --max-count=20` for any prior project history
|
||||
2. Read `.ci/PROJECT.md` for project vision (if exists)
|
||||
3. Read `.ci/config.json` for project settings (if exists)
|
||||
2. Read `.ciagent/PROJECT.md` for project vision (if exists)
|
||||
3. Read `.ciagent/config.json` for project settings (if exists)
|
||||
4. Search the codebase for existing implementations to reuse
|
||||
</project_context>
|
||||
|
||||
@@ -49,7 +49,7 @@ Read the project specification. Understand what the project needs to accomplish.
|
||||
|
||||
## Step 3: Produce Reference Files
|
||||
|
||||
Update `.ci/` static files with research conclusions:
|
||||
Update `.ciagent/` static files with research conclusions:
|
||||
- PROJECT.md: project vision and requirements
|
||||
- ARCHITECTURE.md: recommended system architecture
|
||||
- REQUIREMENTS.md: formal requirements with IDs
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Synthesizes research files for CI into a cohesive summary for roadmap creation. Merges findings from stack, features, architecture, and pitfalls research.
|
||||
description: Synthesizes research files for CIAgent into a cohesive summary for roadmap creation. Merges findings from stack, features, architecture, and pitfalls research.
|
||||
color: "#87CEEB"
|
||||
tools:
|
||||
read: true
|
||||
@@ -9,28 +9,28 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI research synthesizer. You synthesize research files into a cohesive summary for roadmap creation. You merge findings from stack, features, architecture, and pitfalls research.
|
||||
You are a CIAgent research synthesizer. You synthesize research files into a cohesive summary for roadmap creation. You merge findings from stack, features, architecture, and pitfalls research.
|
||||
|
||||
You read git history and .ci/ files to understand what research has already been done, then produce a unified view.
|
||||
You read git history and .ciagent/ files to understand what research has already been done, then produce a unified view.
|
||||
|
||||
**CRITICAL: Mandatory Initial Read**
|
||||
If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to load every file listed there before performing any other actions.
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before synthesizing, load context from git first:
|
||||
|
||||
1. Run `git log --grep="research" --max-count=20` for prior research commits
|
||||
2. Read `.ci/PROJECT.md` for project vision
|
||||
3. Read `.ci/ARCHITECTURE.md` for architecture research
|
||||
4. Read `.ci/REQUIREMENTS.md` for requirements research
|
||||
2. Read `.ciagent/PROJECT.md` for project vision
|
||||
3. Read `.ciagent/ARCHITECTURE.md` for architecture research
|
||||
4. Read `.ciagent/REQUIREMENTS.md` for requirements research
|
||||
5. Use GitContext.getDecisions() for research-based decisions
|
||||
</project_context>
|
||||
|
||||
@@ -38,7 +38,7 @@ Before synthesizing, load context from git first:
|
||||
|
||||
## Step 1: Load All Research
|
||||
|
||||
Read all `.ci/` files and git history for research outputs. Identify the 4 research streams: stack, features, architecture, pitfalls.
|
||||
Read all `.ciagent/` files and git history for research outputs. Identify the 4 research streams: stack, features, architecture, pitfalls.
|
||||
|
||||
## Step 2: Synthesize
|
||||
|
||||
@@ -50,11 +50,11 @@ Cross-reference the research streams:
|
||||
|
||||
## Step 3: Update .ci/ Files
|
||||
|
||||
Update `.ci/` static files with synthesized conclusions. Resolve contradictions by making decisions (logged with confidence).
|
||||
Update `.ciagent/` static files with synthesized conclusions. Resolve contradictions by making decisions (logged with confidence).
|
||||
|
||||
## Step 4: Commit Synthesis
|
||||
|
||||
Commit updated .ci/ files with `---ci---` block capturing synthesis decisions.
|
||||
Commit updated .ciagent/ files with `---ci---` block capturing synthesis decisions.
|
||||
|
||||
## Step 5: Return Result
|
||||
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Investigates the domain for a CI phase using git history, web search, and codebase analysis. Never flags assumptions for human validation — logs assumptions to decisions with confidence scores.
|
||||
description: Investigates the domain for a CIAgent phase using git history, web search, and codebase analysis. Never flags assumptions for human validation — logs assumptions to decisions with confidence scores.
|
||||
color: "#4169E1"
|
||||
tools:
|
||||
read: true
|
||||
@@ -9,20 +9,20 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI researcher. You investigate the domain for a phase using git history, web search, and codebase analysis.
|
||||
You are a CIAgent researcher. You investigate the domain for a phase using git history, web search, and codebase analysis.
|
||||
|
||||
CI researchers NEVER flag `[ASSUMED]` for human validation. Instead, log assumptions to DecisionEngine with confidence scores. Low-confidence assumptions are escalated through the normal decision flow.
|
||||
CIAgent researchers NEVER flag `[ASSUMED]` for human validation. Instead, log assumptions to DecisionEngine with confidence scores. Low-confidence assumptions are escalated through the normal decision flow.
|
||||
|
||||
**CRITICAL: Mandatory Initial Read**
|
||||
If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to load every file listed there before performing any other actions.
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before researching, load context from git first:
|
||||
@@ -30,16 +30,16 @@ Before researching, load context from git first:
|
||||
1. Run `git log --max-count=50` for project history and prior research
|
||||
2. Use GitContext.getDecisions() for existing decisions
|
||||
3. Use GitContext.getCompounds() for compound learnings from past phases
|
||||
4. Read `.ci/PROJECT.md` for project vision and constraints
|
||||
5. Read `.ci/ARCHITECTURE.md` for component boundaries
|
||||
6. Read `.ci/REQUIREMENTS.md` for requirements assigned to this phase
|
||||
4. Read `.ciagent/PROJECT.md` for project vision and constraints
|
||||
5. Read `.ciagent/ARCHITECTURE.md` for component boundaries
|
||||
6. Read `.ciagent/REQUIREMENTS.md` for requirements assigned to this phase
|
||||
</project_context>
|
||||
|
||||
<execution_flow>
|
||||
|
||||
## Step 1: Load Context
|
||||
|
||||
Read git history and .ci/ files. Extract phase requirements and existing decisions.
|
||||
Read git history and .ciagent/ files. Extract phase requirements and existing decisions.
|
||||
|
||||
## Step 2: Research Domain
|
||||
|
||||
@@ -51,7 +51,7 @@ Read git history and .ci/ files. Extract phase requirements and existing decisio
|
||||
|
||||
## Step 3: Commit Findings
|
||||
|
||||
Research conclusions update `.ci/` static files. Key findings go in the commit body. Decisions go in `---ci---` blocks:
|
||||
Research conclusions update `.ciagent/` static files. Key findings go in the commit body. Decisions go in `---ci---` blocks:
|
||||
|
||||
```
|
||||
docs(P##): research [topic]
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Creates CI project roadmaps with phase breakdown, requirement mapping, success criteria derivation, and coverage validation. Uses git history to understand project context.
|
||||
description: Creates CIAgent project roadmaps with phase breakdown, requirement mapping, success criteria derivation, and coverage validation. Uses git history to understand project context.
|
||||
color: "#20B2AA"
|
||||
tools:
|
||||
read: true
|
||||
@@ -10,7 +10,7 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI roadmapper. You create project roadmaps with phase breakdown, requirement mapping, success criteria derivation, and coverage validation.
|
||||
You are a CIAgent roadmapper. You create project roadmaps with phase breakdown, requirement mapping, success criteria derivation, and coverage validation.
|
||||
|
||||
You use git history to understand the project context and ensure every requirement is mapped to a phase.
|
||||
|
||||
@@ -19,27 +19,27 @@ If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before roadmapping, load context from git first:
|
||||
|
||||
1. Run `git log --max-count=30` for project history
|
||||
2. Use GitContext.getDecisions() for existing decisions
|
||||
3. Read `.ci/PROJECT.md` for project vision and constraints
|
||||
4. Read `.ci/REQUIREMENTS.md` for all requirements
|
||||
5. Read `.ci/ARCHITECTURE.md` for component boundaries and build order
|
||||
3. Read `.ciagent/PROJECT.md` for project vision and constraints
|
||||
4. Read `.ciagent/REQUIREMENTS.md` for all requirements
|
||||
5. Read `.ciagent/ARCHITECTURE.md` for component boundaries and build order
|
||||
</project_context>
|
||||
|
||||
<execution_flow>
|
||||
|
||||
## Step 1: Load Context
|
||||
|
||||
Read git history and .ci/ files. Extract all requirements and architectural constraints.
|
||||
Read git history and .ciagent/ files. Extract all requirements and architectural constraints.
|
||||
|
||||
## Step 2: Break Into Phases
|
||||
|
||||
@@ -50,7 +50,7 @@ Read git history and .ci/ files. Extract all requirements and architectural cons
|
||||
|
||||
## Step 3: Write ROADMAP.md
|
||||
|
||||
Write `.ci/ROADMAP.md` using CiFiles.writeRoadmapMd():
|
||||
Write `.ciagent/ROADMAP.md` using CiFiles.writeRoadmapMd():
|
||||
- Overview
|
||||
- Phase list with status, dependencies, requirements, success criteria
|
||||
- Phase details section
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Verifies threat mitigation coverage for a CI phase — reads plan threat data, analyzes codebase for security concerns, classifies threats. Auto-dispositions: low=accept, medium=mitigate, high=escalate. Read-only — does not modify source code.
|
||||
description: Verifies threat mitigation coverage for a CIAgent phase — reads plan threat data, analyzes codebase for security concerns, classifies threats. Auto-dispositions: low=accept, medium=mitigate, high=escalate. Read-only — does not modify source code.
|
||||
color: "#FF0000"
|
||||
tools:
|
||||
read: true
|
||||
@@ -9,9 +9,9 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI security auditor. You verify that security threats identified during planning have been properly mitigated in the implementation.
|
||||
You are a CIAgent security auditor. You verify that security threats identified during planning have been properly mitigated in the implementation.
|
||||
|
||||
CI security auditors auto-disposition threats: low=accept, medium=mitigate, high=escalate. Only high-severity threats with no clear mitigation are escalated to human.
|
||||
CIAgent security auditors auto-disposition threats: low=accept, medium=mitigate, high=escalate. Only high-severity threats with no clear mitigation are escalated to human.
|
||||
|
||||
You are READ-ONLY. Do not modify source code.
|
||||
|
||||
@@ -20,11 +20,11 @@ If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before auditing, load context from git first:
|
||||
@@ -32,15 +32,15 @@ Before auditing, load context from git first:
|
||||
1. Run `git log --grep="security" --max-count=20` for prior security decisions
|
||||
2. Use GitContext.getDecisions(currentPhase) for phase decisions
|
||||
3. Use GitContext.getEscalations() for pending security escalations
|
||||
4. Read `.ci/config.json` for security enforcement settings
|
||||
5. Read `.ci/ARCHITECTURE.md` for trust boundaries
|
||||
4. Read `.ciagent/config.json` for security enforcement settings
|
||||
5. Read `.ciagent/ARCHITECTURE.md` for trust boundaries
|
||||
</project_context>
|
||||
|
||||
<execution_flow>
|
||||
|
||||
## Step 1: Load Context
|
||||
|
||||
Read git security history and .ci/ files. Extract trust boundaries and prior threat classifications.
|
||||
Read git security history and .ciagent/ files. Extract trust boundaries and prior threat classifications.
|
||||
|
||||
## Step 2: STRIDE Analysis
|
||||
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Analyzes a recently solved CI problem and produces a structured compound learning document. Compound learnings are committed as ---ci--- blocks, not separate files.
|
||||
description: Analyzes a recently solved CIAgent problem and produces a structured compound learning document. Compound learnings are committed as ---ci--- blocks, not separate files.
|
||||
color: "#9370DB"
|
||||
tools:
|
||||
read: true
|
||||
@@ -10,7 +10,7 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI solution writer. You analyze recently solved problems and produce structured compound learning documents. Compound learnings are committed as `---ci---` blocks, not separate files.
|
||||
You are a CIAgent solution writer. You analyze recently solved problems and produce structured compound learning documents. Compound learnings are committed as `---ci---` blocks, not separate files.
|
||||
|
||||
You use git history to understand the problem context and trace the solution path.
|
||||
|
||||
@@ -19,11 +19,11 @@ If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before analyzing, load context from git first:
|
||||
@@ -31,7 +31,7 @@ Before analyzing, load context from git first:
|
||||
1. Run `git log --max-count=20` for recent problem-solving history
|
||||
2. Use GitContext.getLessons() for lessons learned
|
||||
3. Use GitContext.getCompounds() for existing compound learnings (avoid duplicates)
|
||||
4. Read `.ci/ARCHITECTURE.md` for component context
|
||||
4. Read `.ciagent/ARCHITECTURE.md` for component context
|
||||
</project_context>
|
||||
|
||||
<execution_flow>
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Verifies that a CI phase goal was actually achieved after execution — checks must_haves, requirement coverage, and integration links. Never produces human_needed unless truly unverifiable. Generates automated test scripts for unverifiable items.
|
||||
description: Verifies that a CIAgent phase goal was actually achieved after execution — checks must_haves, requirement coverage, and integration links. Never produces human_needed unless truly unverifiable. Generates automated test scripts for unverifiable items.
|
||||
color: "#800080"
|
||||
tools:
|
||||
read: true
|
||||
@@ -9,20 +9,20 @@ tools:
|
||||
---
|
||||
|
||||
<role>
|
||||
You are a CI verifier. You verify that a phase was completed correctly — not just that code was written, but that the phase goal is genuinely achieved.
|
||||
You are a CIAgent verifier. You verify that a phase was completed correctly — not just that code was written, but that the phase goal is genuinely achieved.
|
||||
|
||||
CI verifiers NEVER produce `human_needed` unless something is truly unverifiable. Generate automated test scripts for traditionally human-verified items.
|
||||
CIAgent verifiers NEVER produce `human_needed` unless something is truly unverifiable. Generate automated test scripts for traditionally human-verified items.
|
||||
|
||||
**CRITICAL: Mandatory Initial Read**
|
||||
If the prompt contains a `<files_to_read>` block, you MUST use the Read tool to load every file listed there before performing any other actions.
|
||||
</role>
|
||||
|
||||
<project_context>
|
||||
If .ci/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ci/config.json
|
||||
If .ciagent/config.json has projects[] with length > 0, you are in multi-project mode.
|
||||
- Read active_project from .ciagent/config.json
|
||||
- All commits must include `project: <active_project>` in ---ci--- block
|
||||
- Branch names are prefixed with <slug>/ in multi-project mode
|
||||
- .ci/ files are in .ci/<slug>/ subdirectories
|
||||
- .ciagent/ files are in .ciagent/<slug>/ subdirectories
|
||||
If single-project mode (projects[] empty or absent), use existing conventions.
|
||||
|
||||
Before verifying, load context from git first:
|
||||
@@ -30,8 +30,8 @@ Before verifying, load context from git first:
|
||||
1. Run `git log --grep="P##" --max-count=50` for all phase commits
|
||||
2. Use GitContext.reconstructState() for current project state
|
||||
3. Use GitContext.getRequirementsCoverage() for covered/partial requirements
|
||||
4. Read `.ci/ROADMAP.md` for phase goal and success criteria
|
||||
5. Read `.ci/REQUIREMENTS.md` for requirement IDs
|
||||
4. Read `.ciagent/ROADMAP.md` for phase goal and success criteria
|
||||
5. Read `.ciagent/REQUIREMENTS.md` for requirement IDs
|
||||
6. Use GitContext.getCommitsForPhase(currentPhase) for phase commit history
|
||||
</project_context>
|
||||
|
||||
|
||||
+1
-1
@@ -1 +1 @@
|
||||
0.5.0
|
||||
0.7.0
|
||||
@@ -1,20 +1,21 @@
|
||||
<dev_context>
|
||||
|
||||
Agent output guidance for CI dev mode. Loaded when the orchestrator operates in default (dev) mode.
|
||||
Agent output guidance for CIAgent dev mode. Loaded when the orchestrator operates in default (dev) mode.
|
||||
|
||||
---
|
||||
|
||||
## Multi-Project and NFR Versioning
|
||||
## Multi-Project and Milestone Versioning
|
||||
|
||||
When in multi-project mode (`.ci/config.json` has `projects[]` with length > 0):
|
||||
When in multi-project mode (`.ciagent/config.json` has `projects[]` with length > 0):
|
||||
- All commits include `project: <slug>` in `---ci---` block
|
||||
- Branch names are prefixed with `<slug>/`
|
||||
- `.ci/` files are in `.ci/<slug>/` subdirectories
|
||||
- `.ciagent/` files are in `.ciagent/<slug>/` subdirectories
|
||||
- Project scoping applies to all operations
|
||||
|
||||
NFR milestone versioning:
|
||||
- NFR milestones (all phases are fix/chore/docs/perf/refactor/test): progressive patch versions only, no minor tag
|
||||
- Feature milestones (any feat phase): progressive patch versions + minor milestone tag
|
||||
Milestone versioning (determined by `getMilestoneType()` before any development):
|
||||
- **NFR** (all phases: fix/chore/docs/perf/refactor/test): progressive patch versions, no milestone tag — final patch IS the deliverable
|
||||
- **Feature** (at least one `feat` phase): progressive patch versions + next minor milestone tag
|
||||
- **Major** (breaking schema changes or complete refactor): progressive minor versions per phase + major milestone tag
|
||||
|
||||
## Output Style
|
||||
|
||||
@@ -27,7 +28,7 @@ NFR milestone versioning:
|
||||
|
||||
- Working code that compiles and passes tests
|
||||
- Minimal diff — change only what is necessary
|
||||
- Commit with `---ci---` blocks for all CI-generated work
|
||||
- Commit with `---ci---` blocks for all CIAgent-generated work
|
||||
- Flag side effects or breaking changes immediately
|
||||
- Surface the next actionable step at the end of every response
|
||||
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
<research_context>
|
||||
|
||||
Agent output guidance for CI research mode. Loaded when the orchestrator operates in research mode.
|
||||
Agent output guidance for CIAgent research mode. Loaded when the orchestrator operates in research mode.
|
||||
|
||||
---
|
||||
|
||||
@@ -21,12 +21,12 @@ Agent output guidance for CI research mode. Loaded when the orchestrator operate
|
||||
|
||||
## Research Output
|
||||
|
||||
Research is intermediate work product — conclusions update `.ci/<slug>/` static files (ARCHITECTURE.md, PROJECT.md) and contain:
|
||||
Research is intermediate work product — conclusions update `.ciagent/<slug>/` static files (ARCHITECTURE.md, PROJECT.md) and contain:
|
||||
- Key findings in the commit body
|
||||
- Decisions in the `---ci---` block
|
||||
- Confidence levels for each recommendation
|
||||
|
||||
In multi-project mode, research conclusions update files in `.ci/<slug>/` subdirectories, not the root `.ci/` directory.
|
||||
In multi-project mode, research conclusions update files in `.ciagent/<slug>/` subdirectories, not the root `.ciagent/` directory.
|
||||
|
||||
## Verbosity
|
||||
|
||||
|
||||
@@ -1,12 +1,12 @@
|
||||
<review_context>
|
||||
|
||||
Agent output guidance for CI review mode. Loaded when the orchestrator operates in review mode.
|
||||
Agent output guidance for CIAgent review mode. Loaded when the orchestrator operates in review mode.
|
||||
|
||||
---
|
||||
|
||||
## Multi-Project Awareness
|
||||
|
||||
When in multi-project mode (`.ci/config.json` has `projects[]` with length > 0):
|
||||
When in multi-project mode (`.ciagent/config.json` has `projects[]` with length > 0):
|
||||
- All reviews are scoped to the active project
|
||||
- Commits include `project: <slug>` in `---ci---` blocks
|
||||
- Branch names are prefixed with `<slug>/`
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
<branch_strategy>
|
||||
|
||||
Canonical branch naming and lifecycle conventions for CI. Branches encode project structure — merged branches indicate completed work, active branches indicate work in progress.
|
||||
Canonical branch naming and lifecycle conventions for CIAgent. Branches encode project structure — merged branches indicate completed work, active branches indicate work in progress.
|
||||
|
||||
---
|
||||
|
||||
@@ -23,7 +23,7 @@ Canonical branch naming and lifecycle conventions for CI. Branches encode projec
|
||||
**Lifecycle:**
|
||||
1. Created at phase start by `GitBranch.createPhaseBranch()`
|
||||
2. All task commits for the phase land on this branch
|
||||
3. Merged to main (squash) on phase completion
|
||||
3. Merged to their milestone branch (or main if no milestone branch) on phase completion
|
||||
4. Merged = phase complete, active = phase in progress, absent = not started
|
||||
|
||||
### Milestone Branches
|
||||
@@ -42,14 +42,33 @@ Canonical branch naming and lifecycle conventions for CI. Branches encode projec
|
||||
**Lifecycle:**
|
||||
1. Created at first phase of milestone by `GitBranch.createMilestoneBranch()`
|
||||
2. Spans multiple phases within the same milestone
|
||||
3. Merged to main on milestone completion
|
||||
4. Merged = milestone complete, active = milestone in progress
|
||||
3. All phase branches merge into this branch on completion
|
||||
4. Merged to main on milestone completion
|
||||
5. Merged = milestone complete, active = milestone in progress
|
||||
|
||||
### Hotfix Branches
|
||||
|
||||
**Format:** `hotfix/description`
|
||||
|
||||
Created for urgent fixes outside the normal phase flow. Merged directly to main.
|
||||
Created for urgent fixes outside the normal phase flow. Merged directly to main (exception to hierarchy).
|
||||
|
||||
## Branch Hierarchy (Enforced)
|
||||
|
||||
```text
|
||||
main ─── milestone/vX.X-slug ─── phase/NN-slug
|
||||
|
||||
Rules:
|
||||
- Phase branches MUST merge into their milestone branch first
|
||||
- Milestone branches merge into main only after all phase branches are merged
|
||||
- If no milestone branch exists, phases may merge directly to main
|
||||
- Hotfix branches merge directly to main (exception)
|
||||
```
|
||||
|
||||
**Validation** is enforced in `GitBranch.mergePhaseBranch()` and `createShipCommand()`:
|
||||
- Phase → main: rejected if milestone branch exists for this milestone
|
||||
- Phase → milestone: allowed
|
||||
- Milestone → main: allowed only after all phase branches are merged
|
||||
- Hotfix → main: allowed
|
||||
|
||||
## Branch Status Inference
|
||||
|
||||
@@ -69,71 +88,119 @@ const branches = gitContext.getBranches();
|
||||
|
||||
## Merge Strategy
|
||||
|
||||
Default: **squash merge** into main.
|
||||
Default: **squash merge**.
|
||||
|
||||
Phase branches squash-merge into their milestone branch. Milestone branches squash-merge into main. This keeps main clean while preserving full development history in the phase branch.
|
||||
|
||||
```typescript
|
||||
gitBranch.mergePhaseBranch("phase/01-git-native-architecture", "main", true);
|
||||
// Phase → milestone (enforced when milestone branch exists)
|
||||
gitBranch.mergePhaseBranch("phase/01-git-native-architecture", "milestone/v0.5-honest-baseline", true);
|
||||
|
||||
// Milestone → main (after all phases merged)
|
||||
gitBranch.mergeMilestoneBranch("milestone/v0.5-honest-baseline", "main", true);
|
||||
```
|
||||
|
||||
Squash merge keeps main clean while preserving full development history in the phase branch. Phase branches can be deleted after merge if desired.
|
||||
Phase branches can be deleted after merge if desired.
|
||||
|
||||
## Versioning and Releases
|
||||
|
||||
**Every merge to main creates a release. No exceptions.** Versioning maps to project structure:
|
||||
**Every merge to main creates a release. No exceptions.** Versioning follows the milestone type model:
|
||||
|
||||
| Version Part | When | Example |
|
||||
|-------------|------|---------|
|
||||
| **Major** (X.0.0) | Project-level refactor or schema change | `v1.0.0` |
|
||||
| **Minor** (0.X.0) | Every milestone completion | `v0.3.0` |
|
||||
| **Patch** (0.0.X) | Every phase completion | `v0.2.3` |
|
||||
### Milestone Type and Versioning
|
||||
|
||||
### Phase completion (patch release)
|
||||
The milestone type is determined **before any development work** and governs all versioning for the entire milestone.
|
||||
|
||||
**Define semver at milestone start:** establish the version and milestone type before writing code.
|
||||
|
||||
Determine milestone type via `getMilestoneType()` which returns `"nfr" | "feature" | "major"`:
|
||||
|
||||
| Milestone Type | Condition | Phase release | Milestone release |
|
||||
|---------------|-----------|---------------|-------------------|
|
||||
| **NFR** | All phases are fix/chore/docs/perf/refactor/test | Patch — `v1.8.1`, `v1.8.2`, ... | None — final patch IS the deliverable |
|
||||
| **Feature** | At least one phase has new features (`feat`) | Patch — `v1.8.1`, `v1.8.2`, ... | Next minor — `v1.9.0` |
|
||||
| **Major** | Breaking schema changes or complete refactor | Minor — `v2.1.0`, `v2.2.0`, ... | Major — `v3.0.0` |
|
||||
|
||||
**Tag rules (CRITICAL):**
|
||||
- Milestone tags are always the NEXT version, never the base:
|
||||
- Feature: patches v0.5.1–v0.5.5 → milestone tag is v0.6.0 (NOT v0.5.0)
|
||||
- Major: minors v0.3.0, v0.4.0, v0.5.0 → milestone tag is v1.0.0
|
||||
- NFR: no milestone tag — the final patch release IS the deliverable
|
||||
- Tags must be strictly greater than all existing tags on the same major.minor line
|
||||
- NEVER create a milestone tag that is semantically below existing phase tags
|
||||
|
||||
### Phase completion
|
||||
|
||||
**NFR/Feature (patch release):**
|
||||
```bash
|
||||
git checkout main
|
||||
git merge --squash phase/01-git-native-architecture
|
||||
git commit -m "docs(P01): complete git-native-architecture phase"
|
||||
git tag -a v0.2.1 -m "v0.2.1: git-native-architecture"
|
||||
git checkout milestone/v0.5-honest-baseline # or main if no milestone branch
|
||||
git merge --squash phase/01-quick-wins
|
||||
git commit -m "docs(P01): complete quick-wins phase"
|
||||
git tag -a v0.5.1 -m "v0.5.1: quick-wins"
|
||||
git push origin main --tags
|
||||
# Create Gitea release for v0.2.1
|
||||
# Create Gitea release for v0.5.1
|
||||
```
|
||||
|
||||
Phase number within the milestone determines the patch version (1st phase = .1, 2nd phase = .2, etc.)
|
||||
|
||||
### Milestone completion (minor release)
|
||||
|
||||
**Major (minor release per phase):**
|
||||
```bash
|
||||
git checkout main
|
||||
git merge --squash milestone/v0.2-git-native
|
||||
git commit -m "docs(milestone): complete git-native"
|
||||
git tag -a v0.2.0 -m "v0.2.0: git-native"
|
||||
git checkout milestone/v0.5-schema-rewrite
|
||||
git merge --squash phase/01-core-refactor
|
||||
git commit -m "docs(P01): complete core-refactor phase"
|
||||
git tag -a v0.5.0 -m "v0.5.0: core-refactor"
|
||||
git push origin main --tags
|
||||
# Create Gitea release for v0.2.0 with full milestone summary
|
||||
# Create Gitea release for v0.5.0
|
||||
```
|
||||
|
||||
### Major release
|
||||
Each major phase bumps the minor. 1st phase = next available minor, 2nd = minor+1, etc.
|
||||
|
||||
When the project undergoes a schema-breaking change (e.g., switching from file-based to git-native architecture), bump the major version. Major releases follow the same merge → tag → release flow.
|
||||
### Milestone completion
|
||||
|
||||
## NFR Milestone Versioning
|
||||
**Feature (minor release):**
|
||||
```bash
|
||||
# All phases already merged into milestone branch
|
||||
git checkout main
|
||||
git merge --squash milestone/v0.5-honest-baseline
|
||||
git commit -m "docs(milestone): complete honest-baseline"
|
||||
git tag -a v0.6.0 -m "v0.6.0: honest-baseline" # NEXT minor, NOT v0.5.0
|
||||
git push origin main --tags
|
||||
# Create Gitea release for v0.6.0 with full milestone summary
|
||||
```
|
||||
|
||||
NFR milestones and feature milestones follow different versioning rules:
|
||||
**Major (major release):**
|
||||
```bash
|
||||
# All phases already merged into milestone branch
|
||||
git checkout main
|
||||
git merge --squash milestone/v0.5-schema-rewrite
|
||||
git commit -m "docs(milestone): complete schema-rewrite"
|
||||
git tag -a v1.0.0 -m "v1.0.0: schema-rewrite" # NEXT major
|
||||
git push origin main --tags
|
||||
# Create Gitea release for v1.0.0 with full milestone summary
|
||||
```
|
||||
|
||||
**NFR milestones** — all phases are `fix`, `chore`, `docs`, `perf`, `refactor`, or `test`:
|
||||
- Each phase gets a progressive patch version (v0.1.1, v0.1.2, v0.1.3)
|
||||
- No separate milestone tag — the milestone is implicit from the patch sequence
|
||||
- Example: milestone v0.1 with phases P01 (chore), P02 (test), P03 (perf) → v0.1.1, v0.1.2, v0.1.3
|
||||
**NFR milestones produce no milestone tag.** The last phase's patch version is the final release.
|
||||
|
||||
**Feature milestones** — any phase is `feat`:
|
||||
- Each phase gets a progressive patch version
|
||||
- On milestone completion, tag a minor version (e.g., v0.2.0)
|
||||
- Example: milestone v0.2 with phases P01 (feat), P02 (feat), P03 (fix) → v0.2.1, v0.2.2, v0.2.3 + milestone tag v0.3.0
|
||||
### Version Validation
|
||||
|
||||
Determine milestone type by checking `isNfrMilestone()` which inspects all phase commit types within the milestone.
|
||||
Before creating any tag:
|
||||
1. Tag must be strictly greater than all existing tags on the same major.minor line
|
||||
2. Milestone completion tag must be next minor (feature) or next major (major)
|
||||
3. NEVER create a tag that is semantically below existing phase tags
|
||||
|
||||
### Merge Validation Gates
|
||||
|
||||
The branch hierarchy `main > milestone/vX.X-slug > phase/NN-slug` is enforced at merge time:
|
||||
|
||||
| Merge Type | Rule | Validation |
|
||||
|------------|------|-------------|
|
||||
| Phase → Milestone | Must target milestone branch when one exists | REJECTED if milestone branch does not exist for this phase's milestone |
|
||||
| Phase → Main | Only allowed when no milestone branch exists | REJECTED if a milestone branch exists for this milestone |
|
||||
| Milestone → Main | Only after all phase branches are merged | REJECTED if any phase branches for this milestone are unmerged |
|
||||
| Hotfix → Main | Allowed (exception to hierarchy) | Always allowed |
|
||||
|
||||
## Multi-Project Branch Naming
|
||||
|
||||
When operating in multi-project mode (`.ci/config.json` has `projects[]` with length > 0):
|
||||
When operating in multi-project mode (`.ciagent/config.json` has `projects[]` with length > 0):
|
||||
|
||||
| Branch Type | Format | Example |
|
||||
|-------------|--------|---------|
|
||||
@@ -155,7 +222,7 @@ const milestones = gitBranch.listMilestones();
|
||||
|
||||
## Branch Creation Rules
|
||||
|
||||
1. Always create phase branches from main (or the current milestone branch)
|
||||
1. Always create phase branches from the current milestone branch (or main if no milestone branch exists)
|
||||
2. Never create a branch for a completed phase — it should already be merged
|
||||
3. Milestone branches span phases — don't create one per phase
|
||||
4. Use `GitBranch.createPhaseBranch()` to ensure consistent naming
|
||||
@@ -164,25 +231,35 @@ const milestones = gitBranch.listMilestones();
|
||||
## Working with Phase Branches
|
||||
|
||||
```bash
|
||||
# Create a phase branch
|
||||
git checkout -b phase/01-git-native-architecture
|
||||
# Create a milestone branch first
|
||||
git checkout main
|
||||
git checkout -b milestone/v0.5-honest-baseline
|
||||
|
||||
# Create a phase branch from the milestone
|
||||
git checkout -b phase/01-quick-wins
|
||||
|
||||
# Commit work with ---ci--- blocks
|
||||
git commit -m "feat(P01-01-01): implement commit parser
|
||||
|
||||
---ci---
|
||||
phase: 1
|
||||
milestone: v0.2
|
||||
milestone: v0.5
|
||||
plan: 01-01
|
||||
task: 01-01-01
|
||||
status: execute
|
||||
---/ci---"
|
||||
|
||||
# Merge on completion
|
||||
# Merge phase into milestone on completion
|
||||
git checkout milestone/v0.5-honest-baseline
|
||||
git merge --squash phase/01-quick-wins
|
||||
git commit -m "docs(P01): complete quick-wins phase"
|
||||
git tag -a v0.5.1 -m "v0.5.1: quick-wins"
|
||||
|
||||
# After all phases, merge milestone into main
|
||||
git checkout main
|
||||
git merge --squash phase/01-git-native-architecture
|
||||
git commit -m "docs(P01): complete git-native-architecture phase"
|
||||
git tag -a v0.2.1 -m "v0.2.1: git-native-architecture"
|
||||
git merge --squash milestone/v0.5-honest-baseline
|
||||
git commit -m "docs(milestone): complete honest-baseline"
|
||||
git tag -a v0.6.0 -m "v0.6.0: honest-baseline"
|
||||
git push origin main --tags
|
||||
```
|
||||
|
||||
|
||||
@@ -1,15 +1,15 @@
|
||||
<ci_files_discipline>
|
||||
|
||||
How CI manages the `.ci/` directory — long-lived reference documents only. Dynamic state lives in the git log via `---ci---` YAML blocks, not in files.
|
||||
How CIAgent manages the `.ciagent/` directory — long-lived reference documents only. Dynamic state lives in the git log via `---ci---` YAML blocks, not in files.
|
||||
|
||||
---
|
||||
|
||||
## Multi-Project Directory Structure
|
||||
|
||||
In multi-project mode, `.ci/` uses subdirectories per project:
|
||||
In multi-project mode, `.ciagent/` uses subdirectories per project:
|
||||
|
||||
```
|
||||
.ci/
|
||||
.ciagent/
|
||||
config.json # Registry with projects[] and active_project
|
||||
<project-slug>/
|
||||
PROJECT.md
|
||||
@@ -18,11 +18,11 @@ In multi-project mode, `.ci/` uses subdirectories per project:
|
||||
REQUIREMENTS.md
|
||||
```
|
||||
|
||||
`.ci/config.json` serves as the registry with `projects[]` (array of project entries) and `active_project` (slug of the currently active project).
|
||||
`.ciagent/config.json` serves as the registry with `projects[]` (array of project entries) and `active_project` (slug of the currently active project).
|
||||
|
||||
**Backward compatibility:** if `.ci/` has flat files (PROJECT.md, ARCHITECTURE.md, etc.) and no project subdirectories, auto-migrate by creating `<default-slug>/` and moving files into it, then updating `config.json` with a single `projects[]` entry.
|
||||
**Backward compatibility:** if `.ciagent/` has flat files (PROJECT.md, ARCHITECTURE.md, etc.) and no project subdirectories, auto-migrate by creating `<default-slug>/` and moving files into it, then updating `config.json` with a single `projects[]` entry.
|
||||
|
||||
## What Lives in `.ci/`
|
||||
## What Lives in `.ciagent/`
|
||||
|
||||
| File | Purpose | Update Frequency |
|
||||
|------|---------|-------------------|
|
||||
@@ -32,23 +32,23 @@ In multi-project mode, `.ci/` uses subdirectories per project:
|
||||
| `<slug>/ROADMAP.md` | Phase breakdown, milestone mapping, success criteria per project | Low (phase transitions) |
|
||||
| `<slug>/REQUIREMENTS.md` | v1/v2 requirements with REQ-IDs, out of scope, traceability per project | Low (requirement changes) |
|
||||
|
||||
## What Does NOT Live in `.ci/`
|
||||
## What Does NOT Live in `.ciagent/`
|
||||
|
||||
These were removed in v0.2.0 and now live in the git log:
|
||||
|
||||
| Previous Location | Now In | Access Method |
|
||||
|-------------------|--------|---------------|
|
||||
| `.ci/audit/decisions.json` | `---ci---` decisions block | `GitContext.getDecisions()` |
|
||||
| `.ci/audit/escalations.json` | `---ci---` escalations block | `GitContext.getEscalations()` |
|
||||
| `.ci/audit/lessons.json` | `---ci---` lessons block | `GitContext.getLessons()` |
|
||||
| `.ciagent/audit/decisions.json` | `---ci---` decisions block | `GitContext.getDecisions()` |
|
||||
| `.ciagent/audit/escalations.json` | `---ci---` escalations block | `GitContext.getEscalations()` |
|
||||
| `.ciagent/audit/lessons.json` | `---ci---` lessons block | `GitContext.getLessons()` |
|
||||
| `.planning/` directory (removed) | Git log + branches | `GitContext.reconstructState()` |
|
||||
|
||||
## CiFiles API
|
||||
|
||||
| Method | Returns | Purpose |
|
||||
|--------|---------|---------|
|
||||
| `ensureCIDir()` | void | Create `.ci/` if it doesn't exist |
|
||||
| `isInitialized()` | boolean | Check if `.ci/config.json` exists |
|
||||
| `ensureCIDir()` | void | Create `.ciagent/` if it doesn't exist |
|
||||
| `isInitialized()` | boolean | Check if `.ciagent/config.json` exists |
|
||||
| `readProjectMd()` | ProjectMd \| null | Read project definition |
|
||||
| `writeProjectMd(project, reason)` | void | Write project definition |
|
||||
| `readRoadmapMd()` | RoadmapMd \| null | Read roadmap |
|
||||
@@ -66,7 +66,7 @@ These were removed in v0.2.0 and now live in the git log:
|
||||
2. **Phase boundaries** — Major updates happen at phase transitions, not during task execution.
|
||||
3. **Requirements status** — Use `updateRequirementStatus()` for single-status changes, not full rewrites.
|
||||
4. **Phase status** — Use `updatePhaseStatus()` for phase transitions, not full roadmap rewrites.
|
||||
5. **Commit after write** — Every `.ci/` file change should be committed immediately with a `---ci---` block.
|
||||
5. **Commit after write** — Every `.ciagent/` file change should be committed immediately with a `---ci---` block.
|
||||
|
||||
## Update Triggers
|
||||
|
||||
@@ -157,21 +157,21 @@ interface ArchitectureMd {
|
||||
|
||||
## Research and .ci/ File Updates
|
||||
|
||||
Research is intermediate work product. Conclusions from research update `.ci/` static files:
|
||||
Research is intermediate work product. Conclusions from research update `.ciagent/` static files:
|
||||
- Key findings go in the commit body
|
||||
- Decisions go in `---ci---` blocks
|
||||
- Conclusions that change project structure update the appropriate `.ci/<slug>/` files (ARCHITECTURE.md, PROJECT.md, etc.)
|
||||
- Conclusions that change project structure update the appropriate `.ciagent/<slug>/` files (ARCHITECTURE.md, PROJECT.md, etc.)
|
||||
|
||||
Research commits are not final artifacts — they feed into planning and roadmap updates.
|
||||
|
||||
## Anti-Patterns
|
||||
|
||||
- Never write dynamic state (decisions, escalations, lessons) to `.ci/` files
|
||||
- Never update `.ci/` files during task execution — update at phase boundaries
|
||||
- Never write dynamic state (decisions, escalations, lessons) to `.ciagent/` files
|
||||
- Never update `.ciagent/` files during task execution — update at phase boundaries
|
||||
- Never skip the `reason` parameter when writing PROJECT.md
|
||||
- Never commit `.ci/` changes without a `---ci---` block
|
||||
- Never create new files in `.ci/` without updating this reference document
|
||||
- Never store counters, timestamps, or session state in `.ci/` files
|
||||
- Never store research conclusions only in commits — update `.ci/<slug>/` static files with findings
|
||||
- Never commit `.ciagent/` changes without a `---ci---` block
|
||||
- Never create new files in `.ciagent/` without updating this reference document
|
||||
- Never store counters, timestamps, or session state in `.ciagent/` files
|
||||
- Never store research conclusions only in commits — update `.ciagent/<slug>/` static files with findings
|
||||
|
||||
</ci_files_discipline>
|
||||
@@ -1,6 +1,6 @@
|
||||
<commit_schema>
|
||||
|
||||
Canonical `---ci---` YAML block schema for CI commits. Every CI-generated commit contains a structured YAML block that enables full project state reconstruction from the git log alone.
|
||||
Canonical `---ci---` YAML block schema for CIAgent commits. Every CIAgent-generated commit contains a structured YAML block that enables full project state reconstruction from the git log alone.
|
||||
|
||||
---
|
||||
|
||||
@@ -39,7 +39,7 @@ compound: # optional
|
||||
---/ci---
|
||||
```
|
||||
|
||||
The `project` field is required when in multi-project mode (`.ci/config.json` has `projects[]` with length > 0). In single-project mode, it is optional.
|
||||
The `project` field is required when in multi-project mode (`.ciagent/config.json` has `projects[]` with length > 0). In single-project mode, it is optional.
|
||||
|
||||
Example with project field:
|
||||
|
||||
@@ -104,7 +104,7 @@ The `CommitBuilder` class provides typed constructors:
|
||||
|
||||
## Reconstruction Guarantee
|
||||
|
||||
An agent with access to only commit messages (no code, no diffs, no .ci/ files) can reconstruct:
|
||||
An agent with access to only commit messages (no code, no diffs, no .ciagent/ files) can reconstruct:
|
||||
|
||||
1. **Current phase and milestone** — from the latest commit's `phase` and `milestone` fields
|
||||
2. **Pipeline stage** — from the latest commit's `status` field
|
||||
@@ -117,8 +117,8 @@ An agent with access to only commit messages (no code, no diffs, no .ci/ files)
|
||||
|
||||
## Anti-Patterns
|
||||
|
||||
- Never put CI metadata in code comments — it belongs in commit messages
|
||||
- Never omit the `---ci---` block from a CI-generated commit
|
||||
- Never put CIAgent metadata in code comments — it belongs in commit messages
|
||||
- Never omit the `---ci---` block from a CIAgent-generated commit
|
||||
- Never store decisions, escalations, or lessons in files — commit them
|
||||
- Never use a non-standard commit type — use the 14 types above
|
||||
- Never put freeform text inside the YAML block — use the structured fields
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
<decision_engine>
|
||||
|
||||
How CI makes decisions and commits them as git artifacts. The DecisionEngine uses bounded rationality with confidence thresholds to auto-decide or escalate.
|
||||
How CIAgent makes decisions and commits them as git artifacts. The DecisionEngine uses bounded rationality with confidence thresholds to auto-decide or escalate.
|
||||
|
||||
---
|
||||
|
||||
@@ -99,7 +99,7 @@ Decisions can be project-scoped via the `project` field in `---ci---` blocks. Wh
|
||||
|
||||
## Anti-Patterns
|
||||
|
||||
- Never write decisions to a `.ci/audit/` file — commit them
|
||||
- Never write decisions to a `.ciagent/audit/` file — commit them
|
||||
- Never skip recording a decision, even high-confidence ones
|
||||
- Never make a decision without listing alternatives
|
||||
- Never override the confidence threshold without explicit configuration
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
<git_context_loading>
|
||||
|
||||
How CI agents load project context. The git log IS the project memory — a CI agent's first impulse to gather context is `git log` + `git branch`, not file reads.
|
||||
How CIAgent agents load project context. The git log IS the project memory — a CIAgent agent's first impulse to gather context is `git log` + `git branch`, not file reads.
|
||||
|
||||
---
|
||||
|
||||
@@ -8,7 +8,7 @@ How CI agents load project context. The git log IS the project memory — a CI a
|
||||
|
||||
**Read the log first, files second.**
|
||||
|
||||
The git log contains every decision, escalation, lesson, and compound learning through structured `---ci---` YAML blocks. Files in `.ci/` are long-lived reference documents (PROJECT.md, ARCHITECTURE.md, ROADMAP.md, REQUIREMENTS.md, config.json) that change infrequently.
|
||||
The git log contains every decision, escalation, lesson, and compound learning through structured `---ci---` YAML blocks. Files in `.ciagent/` are long-lived reference documents (PROJECT.md, ARCHITECTURE.md, ROADMAP.md, REQUIREMENTS.md, config.json) that change infrequently.
|
||||
|
||||
## Context Loading Sequence
|
||||
|
||||
@@ -19,7 +19,7 @@ The git log contains every decision, escalation, lesson, and compound learning t
|
||||
5. **Requirements coverage** — `GitContext.getRequirementsCoverage()` for covered/partial
|
||||
6. **Lessons scan** — `GitContext.getLessons()` for all learned lessons
|
||||
7. **Compound learnings** — `GitContext.getCompounds()` for cross-phase patterns
|
||||
8. **File reads** — Only now read `.ci/` files (PROJECT.md, ARCHITECTURE.md, etc.)
|
||||
8. **File reads** — Only now read `.ciagent/` files (PROJECT.md, ARCHITECTURE.md, etc.)
|
||||
|
||||
## GitContext API
|
||||
|
||||
@@ -74,19 +74,19 @@ interface ParsedCiCommit {
|
||||
}
|
||||
```
|
||||
|
||||
Commits without `---ci---` blocks have `ci: null` — these are treated as non-CI commits (e.g., manual edits by the developer).
|
||||
Commits without `---ci---` blocks have `ci: null` — these are treated as non-CIAgent commits (e.g., manual edits by the developer).
|
||||
|
||||
## Phase Context Reset
|
||||
|
||||
Between phases, all state is committed to git, then the next phase starts with fresh context from git log — not accumulated conversation history.
|
||||
|
||||
**On opencode (subagent support):** spawn a fresh agent for the next phase. The new agent loads context from git log and `.ci/` files only.
|
||||
**On opencode (subagent support):** spawn a fresh agent for the next phase. The new agent loads context from git log and `.ciagent/` files only.
|
||||
|
||||
**On platforms without subagents:** simulated reset — re-read git context from scratch, ignore prior conversation history. Treat the phase boundary as a hard context boundary.
|
||||
|
||||
**Checkpoint sequence:**
|
||||
1. Commit all work from the current phase
|
||||
2. Update `.ci/` files (ROADMAP.md phase status, REQUIREMENTS.md requirement statuses)
|
||||
2. Update `.ciagent/` files (ROADMAP.md phase status, REQUIREMENTS.md requirement statuses)
|
||||
3. Verify `GitContext.reconstructState()` matches expected state
|
||||
4. Reset context — next phase begins fresh
|
||||
|
||||
@@ -112,11 +112,11 @@ When context is limited:
|
||||
2. `getDecisions(currentPhase)` — current phase decisions only
|
||||
3. `getRequirementsCoverage()` — aggregate view
|
||||
4. Skip lessons/compounds unless specifically needed
|
||||
5. Read `.ci/ROADMAP.md` instead of scanning all phase branches
|
||||
5. Read `.ciagent/ROADMAP.md` instead of scanning all phase branches
|
||||
|
||||
## What NOT to Do
|
||||
|
||||
- Never read `.ci/` files before checking the git log
|
||||
- Never read `.ciagent/` files before checking the git log
|
||||
- Never parse commit messages manually — use `CommitParser.parseCommitMessage()`
|
||||
- Never assume the latest commit reflects the current state — check branches
|
||||
- Never reconstruct state from files when git data is available
|
||||
|
||||
@@ -1,18 +1,18 @@
|
||||
---
|
||||
description: Audit CI project health — reconstruct state from git log, verify .ci/ files match codebase, check for stale references
|
||||
description: Audit CIAgent project health — reconstruct state from git log, verify .ciagent/ files match codebase, check for stale references
|
||||
---
|
||||
|
||||
# CI Audit
|
||||
# CIAgent Audit
|
||||
|
||||
Audit the CI project for health issues. Verifies that git log state matches .ci/ files and that the project can be fully reconstructed from commit messages alone.
|
||||
Audit the CIAgent project for health issues. Verifies that git log state matches .ciagent/ files and that the project can be fully reconstructed from commit messages alone.
|
||||
|
||||
**Usage:** `ci-audit`
|
||||
**Usage:** `ciagent-audit`
|
||||
|
||||
## Step 0: Confirm Active Project
|
||||
|
||||
Check `ci listProjects()` or read `.ci/config.json` to determine if multi-project mode is active.
|
||||
Check `ci listProjects()` or read `.ciagent/config.json` to determine if multi-project mode is active.
|
||||
|
||||
If `.ci/config.json` has `projects[]` with length > 0:
|
||||
If `.ciagent/config.json` has `projects[]` with length > 0:
|
||||
- Confirm `active_project` is correct for this audit
|
||||
- If not, set it with `ci setActiveProject(<slug>)`
|
||||
- Scope audit queries to the active project
|
||||
@@ -26,16 +26,16 @@ Attempt to reconstruct the full project state from commit messages only:
|
||||
|
||||
1. Parse all `---ci---` blocks from git log
|
||||
2. Reconstruct: current phase, milestone, stage, decisions, escalations, requirements, lessons, compounds
|
||||
3. Compare reconstructed state with `.ci/` file contents
|
||||
3. Compare reconstructed state with `.ciagent/` file contents
|
||||
|
||||
## Step 2: Check .ci/ File Discipline
|
||||
|
||||
For each .ci/ file:
|
||||
- `.ci/config.json`: valid JSON, required fields present
|
||||
- `.ci/PROJECT.md`: has required sections (What This Is, Requirements, Constraints, Key Decisions)
|
||||
- `.ci/ROADMAP.md`: phases match git branches (merged = complete, active = in progress)
|
||||
- `.ci/REQUIREMENTS.md`: traceability matrix is complete
|
||||
- `.ci/ARCHITECTURE.md`: components match actual code structure
|
||||
For each .ciagent/ file:
|
||||
- `.ciagent/config.json`: valid JSON, required fields present
|
||||
- `.ciagent/PROJECT.md`: has required sections (What This Is, Requirements, Constraints, Key Decisions)
|
||||
- `.ciagent/ROADMAP.md`: phases match git branches (merged = complete, active = in progress)
|
||||
- `.ciagent/REQUIREMENTS.md`: traceability matrix is complete
|
||||
- `.ciagent/ARCHITECTURE.md`: components match actual code structure
|
||||
|
||||
## Step 3: Check Branch Hygiene
|
||||
|
||||
@@ -46,20 +46,20 @@ For each .ci/ file:
|
||||
## Step 4: Check Commit Discipline
|
||||
|
||||
- Every CI-generated commit should have a `---ci---` block
|
||||
- No stale decisions (decisions from >50 commits ago that are still in `.ci/` but not reflected in code)
|
||||
- No stale decisions (decisions from >50 commits ago that are still in `.ciagent/` but not reflected in code)
|
||||
- No unresolved escalations older than the escalation timeout
|
||||
|
||||
## Step 5: Display Report
|
||||
|
||||
```
|
||||
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
|
||||
CI ► AUDIT REPORT
|
||||
CIAgent ► AUDIT REPORT
|
||||
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
|
||||
|
||||
Reconstruction: [PASS/FAIL] — [details]
|
||||
.ci/ Files: [N] checked, [issues]
|
||||
.ciagent/ Files: [N] checked, [issues]
|
||||
Branches: [N] phase, [N] milestone, [issues]
|
||||
Commits: [N] CI commits, [N] without ---ci--- blocks
|
||||
Commits: [N] CIAgent commits, [N] without ---ci--- blocks
|
||||
|
||||
[If issues found:]
|
||||
Issues:
|
||||
|
||||
@@ -1,18 +1,18 @@
|
||||
---
|
||||
description: Clarify CI project ambiguities — generate questions, accept defaults at full autonomy, present at supervised/guided
|
||||
description: Clarify CIAgent project ambiguities — generate questions, accept defaults at full autonomy, present at supervised/guided
|
||||
---
|
||||
|
||||
# CI Clarify
|
||||
# CIAgent Clarify
|
||||
|
||||
Run the clarification phase for the current CI project. Generate questions about ambiguities, accept defaults automatically at full autonomy, or present to the user at supervised/guided levels.
|
||||
Run the clarification phase for the current CIAgent project. Generate questions about ambiguities, accept defaults automatically at full autonomy, or present to the user at supervised/guided levels.
|
||||
|
||||
**Usage:** `ci-clarify [phase_number]`
|
||||
**Usage:** `ciagent-clarify [phase_number]`
|
||||
|
||||
## Step 0: Confirm Active Project
|
||||
|
||||
Check `ci listProjects()` or read `.ci/config.json` to determine if multi-project mode is active.
|
||||
Check `ci listProjects()` or read `.ciagent/config.json` to determine if multi-project mode is active.
|
||||
|
||||
If `.ci/config.json` has `projects[]` with length > 0:
|
||||
If `.ciagent/config.json` has `projects[]` with length > 0:
|
||||
- Confirm `active_project` is correct for this clarification
|
||||
- If not, set it with `ci setActiveProject(<slug>)`
|
||||
- All commit messages must include `project: <slug>` in `---ci---` block
|
||||
@@ -26,7 +26,7 @@ git log --max-count=20
|
||||
git branch -a
|
||||
```
|
||||
|
||||
Read `.ci/PROJECT.md` and `.ci/REQUIREMENTS.md` for the specification.
|
||||
Read `.ciagent/PROJECT.md` and `.ciagent/REQUIREMENTS.md` for the specification.
|
||||
|
||||
## Step 2: Identify Ambiguities
|
||||
|
||||
@@ -75,8 +75,8 @@ decisions:
|
||||
|
||||
## Step 6: Update .ci/ Files
|
||||
|
||||
Update `.ci/PROJECT.md` with clarified requirements.
|
||||
Update `.ci/REQUIREMENTS.md` with refined requirements.
|
||||
Update `.ciagent/PROJECT.md` with clarified requirements.
|
||||
Update `.ciagent/REQUIREMENTS.md` with refined requirements.
|
||||
|
||||
## Step 7: Report
|
||||
|
||||
|
||||
@@ -1,18 +1,18 @@
|
||||
---
|
||||
description: Systematic CI debugging with git context — triage, diagnose root cause, auto-fix or escalate
|
||||
description: Systematic CIAgent debugging with git context — triage, diagnose root cause, auto-fix or escalate
|
||||
---
|
||||
|
||||
# CI Debug
|
||||
# CIAgent Debug
|
||||
|
||||
Systematic debugging workflow: triage → root cause diagnosis → auto-fix or escalate. Uses git history to find recent changes that may have caused the bug.
|
||||
|
||||
**Usage:** `ci-debug [description]`
|
||||
**Usage:** `ciagent-debug [description]`
|
||||
|
||||
## Step 0: Confirm Active Project
|
||||
|
||||
Check `ci listProjects()` or read `.ci/config.json` to determine if multi-project mode is active.
|
||||
Check `ci listProjects()` or read `.ciagent/config.json` to determine if multi-project mode is active.
|
||||
|
||||
If `.ci/config.json` has `projects[]` with length > 0:
|
||||
If `.ciagent/config.json` has `projects[]` with length > 0:
|
||||
- Confirm `active_project` is correct for this debug session
|
||||
- If not, set it with `ci setActiveProject(<slug>)`
|
||||
- Scope debugging to the active project
|
||||
|
||||
@@ -0,0 +1,288 @@
|
||||
---
|
||||
description: Run the CIAgent ideation pipeline — analyze project for improvement opportunities, validate recommendations with user, update long-term documents
|
||||
---
|
||||
|
||||
# CIAgent Ideate
|
||||
|
||||
Run the CIAgent ideation engine to discover improvement opportunities based on git-native signals, codebase analysis, and cross-project patterns.
|
||||
|
||||
**Usage:** `ciagent ideate [options]`
|
||||
|
||||
## Step 0: Confirm Active Project
|
||||
|
||||
Check `ci listProjects()` or read `.ciagent/config.json` to determine project context.
|
||||
|
||||
If `.ciagent/config.json` has `active_projects` array with length > 0:
|
||||
- Use `--project <slug>` to target a specific project
|
||||
- Use `--project all` to run ideation across all active projects (deduplicate findings)
|
||||
- If no `--project` flag, use first project in `active_projects`
|
||||
|
||||
If `.ciagent/config.json` has `active_project` string (legacy):
|
||||
- Use that project as the target
|
||||
- Backwards-compatible: if both `active_project` and `active_projects` exist, `active_projects` takes precedence
|
||||
|
||||
## Step 1: Load Project Context
|
||||
|
||||
```bash
|
||||
git log --max-count=50
|
||||
git branch -a
|
||||
```
|
||||
|
||||
Read project reference files:
|
||||
- `.ciagent/PROJECT.md` — Vision, requirements, constraints, key decisions
|
||||
- `.ciagent/ROADMAP.md` — Phases, milestones, success criteria
|
||||
- `.ciagent/REQUIREMENTS.md` — REQ-IDs, status, traceability
|
||||
- `.ciagent/ARCHITECTURE.md` — Component boundaries, data flow
|
||||
- `.ciagent/config.json` — Ideation configuration, autonomy level
|
||||
|
||||
## Step 2: Run Ideation Tiers
|
||||
|
||||
Execute tiers in order. Each tier produces `Idea[]` objects. Ideas from all tiers are merged and deduplicated before presentation.
|
||||
|
||||
### Tier 1: Mechanical Analysis (Always Available)
|
||||
|
||||
No backend required. All signals come from git history, `.ciagent/` files, and filesystem.
|
||||
|
||||
#### 2.1 Git-Native Pattern Mining
|
||||
|
||||
```bash
|
||||
git log --all --grep="lessons:" --format="%B" -50
|
||||
git log --all --grep="decisions:" --format="%B" -50 -- "***confidence***0.*"
|
||||
git log --all --grep="escalation:" --format="%B" -50
|
||||
git log --all --grep="compound:" --format="%B" -50
|
||||
```
|
||||
|
||||
Extract:
|
||||
- **Repeated lessons** — topics appearing > 1 time → systemic issue
|
||||
- **Low-confidence decisions** — confidence < 0.7 in `---ci---` blocks → improvement targets
|
||||
- **Escalation types** — each type identifies a process gap
|
||||
- **Compound solutions** — suggest generalizing patterns that were solved multiple times
|
||||
- **Partial requirements** — `requirements: partial: [REQ-XX]` in `---ci---` blocks
|
||||
|
||||
#### 2.2 Coverage Gap Analysis
|
||||
|
||||
- Parse REQUIREMENTS.md for `pending` and `in_progress` status requirements
|
||||
- Cross-reference with PLAN.md task completion
|
||||
- Identify requirements with no corresponding implementation tasks
|
||||
|
||||
#### 2.3 Verification Layer Inversion
|
||||
|
||||
For each verification layer, identify what's MISSING:
|
||||
|
||||
- **Structural**: Files referenced but not created, stubs, TODOs, placeholder implementations
|
||||
- **Behavioral**: Test suites with < 80% coverage, missing test files for covered requirements
|
||||
- **Security**: No STRIDE analysis for modified components, missing input validation patterns
|
||||
- **Quality**: P1/P2 review findings unresolved, consistent style violations
|
||||
|
||||
#### 2.4 Architectural Drift Detection
|
||||
|
||||
- Parse ARCHITECTURE.md component tree
|
||||
- Compare against actual `src/` directory structure
|
||||
- Flag components documented but not implemented
|
||||
- Flag components implemented but not documented
|
||||
- Check import graph for unauthorized dependencies between components
|
||||
|
||||
#### 2.5 Spec-Driven Improvement
|
||||
|
||||
- Analyze REQUIREMENTS.md for ambiguous language ("should" vs "must", undefined terms)
|
||||
- Check for contradictions between requirements
|
||||
- Compare against common patterns for the project type (identified from package.json keywords)
|
||||
- Flag requirements with no verification criteria
|
||||
|
||||
### Tier 2: Backend-Enriched Analysis (When LLM Available)
|
||||
|
||||
Requires an intelligence backend (opencode, openai, anthropic, or ollama).
|
||||
|
||||
#### 2.6 Prioritization and Ranking
|
||||
|
||||
- Evaluate all mechanical findings for impact and feasibility
|
||||
- Rank ideas by: (1) number of signals corroborating, (2) severity of the gap, (3) ease of addressing
|
||||
|
||||
#### 2.7 Novel Improvement Suggestions
|
||||
|
||||
- Suggest improvements beyond pattern matching (e.g., "consider rate limiting" based on industry best practices, not just a repeated lesson)
|
||||
- Generate concrete action plans for each accepted idea
|
||||
- Identify bleeding-edge approaches relevant to the project's tech stack
|
||||
|
||||
#### 2.8 Chaos Engineering Ideation
|
||||
|
||||
- Generate failure scenarios: "What if the backend is unavailable?", "What if a requirement changes mid-implementation?", "What if test coverage drops below threshold?"
|
||||
- Map failure scenarios to code that would break
|
||||
- Suggest resilience improvements for each scenario
|
||||
|
||||
### Tier 3: Cross-Project Pattern Transfer (When Multi-Project Registry Exists)
|
||||
|
||||
#### 2.9 Cross-Project Mining
|
||||
|
||||
For each project in `.ciagent/config.json` projects array:
|
||||
- Read that project's `---ci---` blocks for lessons, decisions, compound solutions
|
||||
- Find patterns relevant to the current project (same requirement area, same tech stack from package.json)
|
||||
- Suggest adaptations of lessons learned elsewhere
|
||||
- Calculate relevance score based on tech stack similarity
|
||||
|
||||
## Step 3: Merge and DeduplicateIdeas
|
||||
|
||||
Combine ideas from all tiers. Deduplicate by:
|
||||
- Same `title` strings → keep highest confidence version
|
||||
- Same `relatedReq` → merge into single idea with combined sources
|
||||
- Same `category` + overlapping domains → keep most specific
|
||||
|
||||
Sort by confidence (descending), then by number of corroborating signals.
|
||||
|
||||
## Step 4: Interactive Validation
|
||||
|
||||
Present ideas one-at-a-time to the user:
|
||||
|
||||
```
|
||||
═══ Recommendation N of M ═══
|
||||
|
||||
Category: [CATEGORY] | Confidence: [0.XX] | Tier: [mechanical/backend-enriched/cross-project]
|
||||
Title: [idea title]
|
||||
Rationale: [idea rationale]
|
||||
Related Req: [REQ-ID or "new requirement"]
|
||||
Source: [source signal type]
|
||||
|
||||
Actions:
|
||||
1. Accept (add to next milestone as new requirement)
|
||||
2. Skip
|
||||
3. Modify (edit title/rationale before accepting)
|
||||
4. Details (show full analysis including signal sources)
|
||||
```
|
||||
|
||||
For each accepted idea:
|
||||
1. Generate `IDEATE-NN` requirement ID
|
||||
2. Prompt for milestone placement (append to existing or create new)
|
||||
3. Add to REQUIREMENTS.md with status `pending`
|
||||
4. Add to ROADMAP.md next milestone
|
||||
|
||||
## Step 5: Update Long-Term Documents
|
||||
|
||||
For each accepted idea:
|
||||
|
||||
### REQUIREMENTS.md
|
||||
|
||||
Add a new row in the appropriate milestone section:
|
||||
```
|
||||
| IDEATE-NN | [idea title] | [priority] | [phase] | pending |
|
||||
```
|
||||
|
||||
### ROADMAP.md
|
||||
|
||||
Add the idea to the next milestone's phase structure:
|
||||
- If next milestone has a matching phase category, append to that phase
|
||||
- If no matching phase, suggest a new phase
|
||||
|
||||
### ARCHITECTURE.md
|
||||
|
||||
If the idea involves architectural changes, note the component change needed.
|
||||
|
||||
### PROJECT.md
|
||||
|
||||
If the idea adds new requirements or key decisions, update accordingly.
|
||||
|
||||
Commit all document updates:
|
||||
```
|
||||
decision(P##): ideation results — [N] accepted, [M] skipped
|
||||
```
|
||||
|
||||
## Step 6: Ask-After-Validation Kickoff
|
||||
|
||||
After all ideas have been validated:
|
||||
|
||||
```
|
||||
Accepted: [N] recommendations
|
||||
Skipped: [M] recommendations
|
||||
|
||||
Would you like to kick off the run workflow for these ideas? (y/n)
|
||||
```
|
||||
|
||||
If yes: Start `ciagent run` with the updated project context. The `--ideate` flag is NOT needed because the ideas are already in ROADMAP.md and REQUIREMENTS.md — the standard pipeline will pick them up.
|
||||
|
||||
If no: Output summary and exit.
|
||||
|
||||
## Command Flags
|
||||
|
||||
| Flag | Description |
|
||||
|------|-------------|
|
||||
| `--category <cats>` | Focus on specific categories: security,quality,architecture,coverage,improvement,spec,chaos (comma-separated) |
|
||||
| `--affected` | Cascade impact analysis: given current changes, what else needs updating |
|
||||
| `--spec` | Analyze specification completeness and ambiguity |
|
||||
| `--external` | Include external signals: npm audit, OSV advisories, dependency staleness |
|
||||
| `--cross-project` | Mine patterns from all projects in multi-project registry |
|
||||
| `--output <format>` | Output format: interactive (default), json, markdown |
|
||||
| `--project <slugs>` | Target project(s): slug, comma-separated, or `all` |
|
||||
| `--backend <provider>` | Override intelligence backend for enrichment tier |
|
||||
|
||||
## Pipeline Integration
|
||||
|
||||
When `ciagent run --ideate` is used, the IDEATE stage is inserted between RESEARCH and PLAN:
|
||||
|
||||
```
|
||||
SPECIFY → CLARIFY → RESEARCH → IDEATE → PLAN → EXECUTE → TEST → VERIFY → COMPLETE
|
||||
```
|
||||
|
||||
IDEATE stage commit:
|
||||
```
|
||||
---ci---
|
||||
phase: [phase-number]
|
||||
milestone: [milestone-version]
|
||||
status: ideate
|
||||
decisions:
|
||||
- id: D-XXX
|
||||
decision: "Accepted [N] ideation recommendations"
|
||||
rationale: "[summary of accepted ideas]"
|
||||
confidence: [avg confidence]
|
||||
requirements:
|
||||
covered: [IDEATE-NN, ...]
|
||||
---/ci---
|
||||
```
|
||||
|
||||
## Output Modes
|
||||
|
||||
### Interactive (default)
|
||||
|
||||
Presented one-at-a-time with accept/skip/modify actions.
|
||||
|
||||
### JSON
|
||||
|
||||
```json
|
||||
{
|
||||
"project": "[slug]",
|
||||
"milestone": "[version]",
|
||||
"ideas": [
|
||||
{
|
||||
"id": "IDEATE-NN",
|
||||
"source": "[source type]",
|
||||
"category": "[category]",
|
||||
"title": "[title]",
|
||||
"rationale": "[rationale]",
|
||||
"confidence": 0.XX,
|
||||
"relatedReq": "[REQ-ID or null]",
|
||||
"actions": ["[action types]"],
|
||||
"tier": "[mechanical/backend-enriched/cross-project]",
|
||||
"accepted": true
|
||||
}
|
||||
],
|
||||
"summary": {
|
||||
"total": 8,
|
||||
"accepted": 6,
|
||||
"skipped": 2,
|
||||
"by_category": { "coverage": 2, "architecture": 1, "security": 1, "quality": 1, "improvement": 1 }
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
### Markdown
|
||||
|
||||
Formatted report suitable for PR descriptions or documentation.
|
||||
|
||||
## Error Recovery
|
||||
|
||||
On tier failure:
|
||||
1. Mechanical tier always succeeds (git + filesystem only)
|
||||
2. Backend-enriched tier: if backend unavailable, fall back to mechanical-only output
|
||||
3. Cross-project tier: if no other projects in registry, skip silently
|
||||
|
||||
On validation failure (no ideas generated):
|
||||
- Output "No improvement ideas identified for this project."
|
||||
- Suggest `ciagent ideate --spec` for specification analysis or `--external` for external signals
|
||||
@@ -1,21 +1,21 @@
|
||||
---
|
||||
description: Initialize a new CI project — specification → clarify → create .ci/ reference files → initial commit
|
||||
description: Initialize a new CIAgent project — specification → clarify → create .ciagent/ reference files → initial commit
|
||||
---
|
||||
|
||||
# CI Init
|
||||
# CIAgent Init
|
||||
|
||||
Initialize a new CI project with specification parsing, clarification, and .ci/ reference file creation.
|
||||
Initialize a new CIAgent project with specification parsing, clarification, and .ciagent/ reference file creation.
|
||||
|
||||
**Usage:** `ci-init [description]`
|
||||
**Usage:** `ciagent-init [description]`
|
||||
|
||||
## Step 0: Confirm Active Project
|
||||
|
||||
Check `ci listProjects()` or read `.ci/config.json` to determine if multi-project mode is active.
|
||||
Check `ci listProjects()` or read `.ciagent/config.json` to determine if multi-project mode is active.
|
||||
|
||||
If `.ci/config.json` has `projects[]` with length > 0:
|
||||
If `.ciagent/config.json` has `projects[]` with length > 0:
|
||||
- Confirm `active_project` is correct for this initialization
|
||||
- If not, set it with `ci setActiveProject(<slug>)`
|
||||
- All subsequent operations use `.ci/<slug>/` subdirectories
|
||||
- All subsequent operations use `.ciagent/<slug>/` subdirectories
|
||||
- All commit messages must include `project: <slug>` in `---ci---` block
|
||||
|
||||
If single-project mode: proceed with existing conventions.
|
||||
@@ -29,12 +29,12 @@ Verify git is initialized:
|
||||
|
||||
If NO_GIT: `git init`
|
||||
|
||||
Check if `.ci/config.json` already exists:
|
||||
Check if `.ciagent/config.json` already exists:
|
||||
```bash
|
||||
[ -f .ci/config.json ] && echo "ALREADY_INITIALIZED" || echo "NEW"
|
||||
[ -f .ciagent/config.json ] && echo "ALREADY_INITIALIZED" || echo "NEW"
|
||||
```
|
||||
|
||||
If ALREADY_INITIALIZED: stop. Use `ci-status` to see project state.
|
||||
If ALREADY_INITIALIZED: stop. Use `ciagent-status` to see project state.
|
||||
|
||||
## Step 2: Parse Specification
|
||||
|
||||
@@ -59,15 +59,15 @@ Analyze the specification for ambiguities. For each ambiguity:
|
||||
|
||||
Record decisions in the `---ci---` block of the init commit.
|
||||
|
||||
## Step 4: Create .ci/ Files
|
||||
## Step 4: Create .ciagent/ Files
|
||||
|
||||
Use CiFiles to create the project structure:
|
||||
|
||||
1. `.ci/config.json` — registry with `projects[]` and `active_project`
|
||||
2. `.ci/<slug>/PROJECT.md` — vision, requirements, constraints, key decisions (or `.ci/PROJECT.md` in single-project mode)
|
||||
3. `.ci/<slug>/ARCHITECTURE.md` — system architecture (initial, may be incomplete)
|
||||
4. `.ci/<slug>/ROADMAP.md` — phase breakdown (to be refined by roadmapper)
|
||||
5. `.ci/<slug>/REQUIREMENTS.md` — formal requirements with REQ-IDs
|
||||
1. `.ciagent/config.json` — registry with `projects[]` and `active_project`
|
||||
2. `.ciagent/<slug>/PROJECT.md` — vision, requirements, constraints, key decisions (or `.ciagent/PROJECT.md` in single-project mode)
|
||||
3. `.ciagent/<slug>/ARCHITECTURE.md` — system architecture (initial, may be incomplete)
|
||||
4. `.ciagent/<slug>/ROADMAP.md` — phase breakdown (to be refined by roadmapper)
|
||||
5. `.ciagent/<slug>/REQUIREMENTS.md` — formal requirements with REQ-IDs
|
||||
|
||||
`initCI()` accepts `projectSlug` and `projectName` parameters for multi-project initialization.
|
||||
|
||||
@@ -105,6 +105,6 @@ Include `project: <slug>` in the `---ci---` block when in multi-project mode.
|
||||
|
||||
## Step 7: Done
|
||||
|
||||
Report project initialized, .ci/ files created, initial branch created.
|
||||
Report project initialized, .ciagent/ files created, initial branch created.
|
||||
|
||||
Next: `ci-run` to execute the pipeline, or `ci-quick` for ad-hoc tasks.
|
||||
Next: `ciagent-run` to execute the pipeline, or `ciagent-quick` for ad-hoc tasks.
|
||||
@@ -1,12 +1,12 @@
|
||||
---
|
||||
description: Execute an ad-hoc CI task with full agentic guarantees — git context, ---ci--- commits, optional research and verification
|
||||
description: Execute an ad-hoc CIAgent task with full agentic guarantees — git context, ---ci--- commits, optional research and verification
|
||||
---
|
||||
|
||||
# CI Quick
|
||||
# CIAgent Quick
|
||||
|
||||
Execute small, ad-hoc tasks with CI guarantees: git context loading, `---ci---` commit blocks, optional research and verification.
|
||||
Execute small, ad-hoc tasks with CIAgent guarantees: git context loading, `---ci---` commit blocks, optional research and verification.
|
||||
|
||||
**Usage:** `ci-quick [description]`
|
||||
**Usage:** `ciagent-quick [description]`
|
||||
|
||||
**Flags:**
|
||||
- `--research` — spawn a focused research agent before execution
|
||||
@@ -15,9 +15,9 @@ Execute small, ad-hoc tasks with CI guarantees: git context loading, `---ci---`
|
||||
|
||||
## Step 0: Confirm Active Project
|
||||
|
||||
Check `ci listProjects()` or read `.ci/config.json` to determine if multi-project mode is active.
|
||||
Check `ci listProjects()` or read `.ciagent/config.json` to determine if multi-project mode is active.
|
||||
|
||||
If `.ci/config.json` has `projects[]` with length > 0:
|
||||
If `.ciagent/config.json` has `projects[]` with length > 0:
|
||||
- Confirm `active_project` is correct
|
||||
- If not, set it with `ci setActiveProject(<slug>)`
|
||||
- All commit messages must include `project: <slug>` in `---ci---` block
|
||||
@@ -37,7 +37,7 @@ git branch -a
|
||||
|
||||
Use GitContext.reconstructState() to understand project state.
|
||||
|
||||
Check that `.ci/config.json` exists. If missing: stop, run `ci-init` first.
|
||||
Check that `.ciagent/config.json` exists. If missing: stop, run `ciagent-init` first.
|
||||
|
||||
## Step 3: Research (only with `--research` or `--full`)
|
||||
|
||||
|
||||
@@ -1,18 +1,18 @@
|
||||
---
|
||||
description: Review CI code changes with multi-persona analysis — auto-apply P0 fixes, flag P1+ for post-hoc review
|
||||
description: Review CIAgent code changes with multi-persona analysis — auto-apply P0 fixes, flag P1+ for post-hoc review
|
||||
---
|
||||
|
||||
# CI Review
|
||||
# CIAgent Review
|
||||
|
||||
Multi-persona code review workflow. Reviews changes in the current phase, auto-applies P0 fixes, and flags P1+ issues for post-hoc review.
|
||||
|
||||
**Usage:** `ci-review [phase_number]`
|
||||
**Usage:** `ciagent-review [phase_number]`
|
||||
|
||||
## Step 0: Confirm Active Project
|
||||
|
||||
Check `ci listProjects()` or read `.ci/config.json` to determine if multi-project mode is active.
|
||||
Check `ci listProjects()` or read `.ciagent/config.json` to determine if multi-project mode is active.
|
||||
|
||||
If `.ci/config.json` has `projects[]` with length > 0:
|
||||
If `.ciagent/config.json` has `projects[]` with length > 0:
|
||||
- Confirm `active_project` is correct for this review
|
||||
- If not, set it with `ci setActiveProject(<slug>)`
|
||||
- All commit messages must include `project: <slug>` in `---ci---` block
|
||||
|
||||
@@ -1,20 +1,20 @@
|
||||
---
|
||||
description: Rollback CI phase — revert the last phase or specified phase by resetting to its pre-phase state
|
||||
description: Rollback CIAgent phase — revert the last phase or specified phase by resetting to its pre-phase state
|
||||
---
|
||||
|
||||
# CI Rollback
|
||||
# CIAgent Rollback
|
||||
|
||||
Rollback a CI phase by reverting to the state before the phase started. Uses git to find the exact commit to reset to.
|
||||
Rollback a CIAgent phase by reverting to the state before the phase started. Uses git to find the exact commit to reset to.
|
||||
|
||||
**Usage:** `ci-rollback [phase_number]`
|
||||
**Usage:** `ciagent-rollback [phase_number]`
|
||||
|
||||
If no phase specified, rolls back the current (most recent) phase.
|
||||
|
||||
## Step 0: Confirm Active Project
|
||||
|
||||
Check `ci listProjects()` or read `.ci/config.json` to determine if multi-project mode is active.
|
||||
Check `ci listProjects()` or read `.ciagent/config.json` to determine if multi-project mode is active.
|
||||
|
||||
If `.ci/config.json` has `projects[]` with length > 0:
|
||||
If `.ciagent/config.json` has `projects[]` with length > 0:
|
||||
- Confirm `active_project` is correct for this rollback
|
||||
- If not, set it with `ci setActiveProject(<slug>)`
|
||||
- Identify project-scoped branches (prefixed with `<slug>/`)
|
||||
@@ -71,8 +71,8 @@ git reset --hard [rollback_point]
|
||||
## Step 5: Update State
|
||||
|
||||
- Delete the phase branch (if not already removed)
|
||||
- Update `.ci/REQUIREMENTS.md` — mark phase requirements as blocked
|
||||
- Update `.ci/ROADMAP.md` — mark phase as not_started
|
||||
- Update `.ciagent/REQUIREMENTS.md` — mark phase requirements as blocked
|
||||
- Update `.ciagent/ROADMAP.md` — mark phase as not_started
|
||||
|
||||
Commit the rollback:
|
||||
|
||||
|
||||
@@ -1,24 +1,31 @@
|
||||
---
|
||||
description: Execute the full CI pipeline — research → plan → execute → verify → complete for the current or specified phase
|
||||
description: Execute the full CIAgent pipeline — research → plan → execute → verify → complete for the current or specified phase
|
||||
---
|
||||
|
||||
# CI Run
|
||||
# CIAgent Run
|
||||
|
||||
Execute the full CI pipeline from the current stage to completion. The orchestrator iterates through stages and delegates to specialized agents.
|
||||
Execute the full CIAgent pipeline from the current stage to completion. The orchestrator iterates through stages and delegates to specialized agents.
|
||||
|
||||
**Usage:** `ci-run [phase_number]`
|
||||
**Usage:** `ciagent-run [phase_number]`
|
||||
|
||||
If no phase number specified, continues from the current phase (detected from git log).
|
||||
|
||||
## Step 0: Confirm Active Project
|
||||
|
||||
Check `ci listProjects()` or read `.ci/config.json` to determine if multi-project mode is active.
|
||||
Check `ci listProjects()` or read `.ciagent/config.json` to determine if multi-project mode is active.
|
||||
|
||||
If `.ci/config.json` has `projects[]` with length > 0:
|
||||
- Confirm `active_project` is correct for this run
|
||||
- If not, set it with `ci setActiveProject(<slug>)`
|
||||
If `.ciagent/config.json` has `projects[]` with length > 0, or `active_projects` array exists:
|
||||
- Confirm `active_projects` is correct for this run
|
||||
- If `--project all` is specified: iterate over all projects in `active_projects`
|
||||
- If `--project <slug>` is specified: run for that project only
|
||||
- If no `--project` flag: use first project in `active_projects`
|
||||
- All commit messages must include `project: <slug>` in `---ci---` block
|
||||
|
||||
For multi-project execution (`--project all`):
|
||||
- Execute pipeline for each project sequentially by default
|
||||
- When `parallelization.enabled=true`: execute projects concurrently up to `max_concurrent_agents`
|
||||
- Each project has independent phase branches and milestone tracking
|
||||
|
||||
If single-project mode: proceed with existing conventions.
|
||||
|
||||
## Step 1: Load Git Context
|
||||
@@ -36,17 +43,17 @@ Determine current state:
|
||||
|
||||
## Step 2: Pre-Flight Check
|
||||
|
||||
Verify `.ci/config.json` exists. If missing: stop, run `ci-init` first.
|
||||
Verify `.ciagent/config.json` exists. If missing: stop, run `ciagent-init` first.
|
||||
|
||||
Read `.ci/PROJECT.md` and `.ci/ROADMAP.md` for phase goals.
|
||||
Read `.ciagent/PROJECT.md` and `.ciagent/ROADMAP.md` for phase goals.
|
||||
|
||||
## Step 3: Execute Pipeline Stages
|
||||
|
||||
For each stage in order (starting from current or from `specify`):
|
||||
|
||||
### SPECIFY
|
||||
- Parse specification from `.ci/PROJECT.md`
|
||||
- Validate requirements exist in `.ci/REQUIREMENTS.md`
|
||||
- Parse specification from `.ciagent/PROJECT.md`
|
||||
- Validate requirements exist in `.ciagent/REQUIREMENTS.md`
|
||||
- Commit: `docs(init): validate specification`
|
||||
|
||||
### CLARIFY
|
||||
@@ -57,9 +64,18 @@ For each stage in order (starting from current or from `specify`):
|
||||
### RESEARCH
|
||||
- Delegate to ci-researcher
|
||||
- Research domain, ecosystem, prior art
|
||||
- Update `.ci/` static files with conclusions
|
||||
- Update `.ciagent/` static files with conclusions
|
||||
- Commit: `docs(P##): research findings`
|
||||
|
||||
### IDEATE (when --ideate flag is passed)
|
||||
- Delegate to ci-ideation-agent
|
||||
- Mine git history for patterns, analyze coverage gaps, detect drift
|
||||
- If backend available: enrich with LLM suggestions
|
||||
- If --cross-project: mine patterns from other projects
|
||||
- Present recommendations interactively (accept/skip/modify)
|
||||
- Accepted ideas update ROADMAP.md and REQUIREMENTS.md
|
||||
- Commit: `decision(P##): ideation results — [N] accepted, [M] skipped`
|
||||
|
||||
### PLAN
|
||||
- Delegate to ci-planner
|
||||
- Create vertical-slice plans with wave ordering
|
||||
@@ -81,28 +97,29 @@ For each stage in order (starting from current or from `specify`):
|
||||
- Merge phase branch into main (squash)
|
||||
- Tag with patch version (e.g., `v0.2.3` — 3rd phase in milestone v0.2)
|
||||
- Create Gitea release for the tag
|
||||
- Update `.ci/REQUIREMENTS.md` requirement statuses
|
||||
- Update `.ci/ROADMAP.md` phase status
|
||||
- Update `.ciagent/REQUIREMENTS.md` requirement statuses
|
||||
- Update `.ciagent/ROADMAP.md` phase status
|
||||
- Commit: `docs(P##): complete [phase-name] phase`
|
||||
|
||||
Versioning: Major = project-level refactor/schema change, Minor = milestone completion, Patch = every phase.
|
||||
Versioning: Major milestone = breaking schema changes, Feature milestone = milestone completion (minor), Patch = every phase.
|
||||
|
||||
## Phase Boundary Checkpoint
|
||||
|
||||
Between phases, perform a context reset:
|
||||
|
||||
1. Commit all work from the current phase
|
||||
2. Update `.ci/` files (phase status, requirement statuses)
|
||||
2. Update `.ciagent/` files (phase status, requirement statuses)
|
||||
3. Verify `GitContext.reconstructState()` matches expected state
|
||||
4. Reset context: spawn fresh agent (opencode) or re-read git context (platforms without subagents)
|
||||
5. Next phase begins with fresh context from git log only
|
||||
|
||||
## NFR Versioning Logic
|
||||
## Versioning Logic
|
||||
|
||||
Before tagging a phase completion, check `isNfrMilestone()`:
|
||||
Before tagging a phase completion, check `getMilestoneType()` which returns `"nfr" | "feature" | "major"`:
|
||||
|
||||
- **NFR milestone** (all phases are fix/chore/docs/perf/refactor/test): apply progressive patch versions (v0.1.1, v0.1.2, v0.1.3). No separate milestone tag.
|
||||
- **Feature milestone** (any feat phase): apply progressive patch versions per phase, then tag minor milestone version on completion (e.g., v0.2.0).
|
||||
- **NFR milestone** (all phases are fix/chore/docs/perf/refactor/test): apply progressive patch versions (v0.1.1, v0.1.2, v0.1.3). No separate milestone tag — the final patch IS the deliverable.
|
||||
- **Feature milestone** (at least one feat phase): apply progressive patch versions per phase, then tag next minor milestone version on completion (e.g., v0.6.0, NOT v0.5.0).
|
||||
- **Major milestone** (breaking schema changes or complete refactor): apply progressive minor versions per phase (v0.3.0, v0.4.0), then tag next major on completion (e.g., v1.0.0).
|
||||
|
||||
## Step 4: Error Recovery
|
||||
|
||||
|
||||
+181
-41
@@ -1,27 +1,51 @@
|
||||
---
|
||||
description: Ship CI phase or milestone — test, tag, release. Every phase gets a patch release. Every milestone gets a minor (or major) release. Full autopilot.
|
||||
description: Ship CIAgent phase or milestone — Full autopilot release: validate, test, merge, tag, push, release. Zero HITL
|
||||
---
|
||||
|
||||
# CI Ship
|
||||
# CIAgent Ship
|
||||
|
||||
Ship a CI phase or milestone. Every ship creates a release — no exceptions.
|
||||
Ship a CIAgent phase or milestone. Every ship creates a release — no exceptions.
|
||||
|
||||
**Versioning rule:**
|
||||
- **Major** (X.0.0): Project-level refactor or schema changes
|
||||
- **Minor** (0.X.0): Feature milestone completion only
|
||||
- **Patch** (0.0.X): Every phase completion
|
||||
**Usage:** `ciagent-ship [phase_number|milestone]`
|
||||
|
||||
**NFR versioning:**
|
||||
- NFR milestones (all phases are fix/chore/docs/perf/refactor/test): progressive patch versions only (v0.1.1, v0.1.2, v0.1.3). No minor milestone tag.
|
||||
- Feature milestones (any feat phase): progressive patch versions per phase + minor milestone tag on completion (e.g., v0.2.0).
|
||||
## Autopilot Rules
|
||||
|
||||
**Usage:** `ci-ship [phase_number|milestone]`
|
||||
These rules are **non-negotiable**. The ship workflow runs in full autopilot mode:
|
||||
|
||||
- **Zero HITL** — no confirmation prompts, no approval gates, no requests for human input. The agent executes the entire release flow autonomously.
|
||||
- **No Shortcuts** — deep validation, testing, and merge checks must all run in full. The lack of HITL is not an excuse to skip steps.
|
||||
- **Notification Only** — status updates are informational, not requests for approval. Report outcomes, never ask permission.
|
||||
- **Autonomous Loop on Failure** — if any step fails (tests, pipeline, merge conflicts), iterate autonomously until success. Do NOT ask the user for guidance on how to fix a failing test or pipeline.
|
||||
- **Branch Hierarchy Enforced** — `main > milestone/vX.X-slug > phase/NN-slug`. Phase merges into milestone, milestone merges into main. This is validated, not assumed.
|
||||
|
||||
## Milestone Type and Versioning
|
||||
|
||||
The milestone type is determined **before any development work** and governs all versioning for the entire milestone.
|
||||
|
||||
**Define semver at milestone start:** establish the version and milestone type before writing code.
|
||||
|
||||
Determine milestone type by calling `getMilestoneType()` which returns `"nfr" | "feature" | "major"`:
|
||||
|
||||
| Milestone Type | Condition | Phase release | Milestone release |
|
||||
|---------------|-----------|---------------|-------------------|
|
||||
| **NFR** | All phases are fix/chore/docs/perf/refactor/test | Patch — `v1.8.1`, `v1.8.2`, ... | None — final patch IS the deliverable |
|
||||
| **Feature** | At least one phase has new features (`feat`) | Patch — `v1.8.1`, `v1.8.2`, ... | Next minor — `v1.9.0` |
|
||||
| **Major** | Breaking schema changes or complete refactor | Minor — `v2.1.0`, `v2.2.0`, ... | Major — `v3.0.0` |
|
||||
|
||||
**Tag rules (CRITICAL):**
|
||||
|
||||
- Milestone tags are always the NEXT version, never the base:
|
||||
- Feature: patches v0.5.1–v0.5.5 → milestone tag is v0.6.0 (NOT v0.5.0)
|
||||
- Major: minors v0.3.0, v0.4.0, v0.5.0 → milestone tag is v1.0.0
|
||||
- NFR: no milestone tag — the final patch release IS the deliverable
|
||||
- Tags must be strictly greater than all existing tags on the same major.minor line
|
||||
- NEVER create a milestone tag that is semantically below existing phase tags
|
||||
|
||||
## Step 0: Confirm Active Project
|
||||
|
||||
Check `ci listProjects()` or read `.ci/config.json` to determine if multi-project mode is active.
|
||||
Check `ci listProjects()` or read `.ciagent/config.json` to determine if multi-project mode is active.
|
||||
|
||||
If `.ci/config.json` has `projects[]` with length > 0:
|
||||
If `.ciagent/config.json` has `projects[]` with length > 0:
|
||||
- Confirm `active_project` is correct for this ship
|
||||
- If not, set it with `ci setActiveProject(<slug>)`
|
||||
- All commit messages must include `project: <slug>` in `---ci---` block
|
||||
@@ -29,21 +53,32 @@ If `.ci/config.json` has `projects[]` with length > 0:
|
||||
|
||||
If single-project mode: proceed with existing conventions.
|
||||
|
||||
## Step 1: Pre-Flight
|
||||
## Step 1: Pre-Flight Validation
|
||||
|
||||
```bash
|
||||
git log --max-count=10
|
||||
git branch -a
|
||||
git tag -l
|
||||
```
|
||||
|
||||
Determine what is being shipped: a single phase (patch release) or an entire milestone (minor/major release).
|
||||
Determine what is being shipped: a single phase or an entire milestone.
|
||||
|
||||
Read `.ci/ROADMAP.md` to determine:
|
||||
Read `.ciagent/ROADMAP.md` to determine:
|
||||
- Current milestone version (e.g., `v0.2`)
|
||||
- Phase number within the milestone
|
||||
- Whether this is the last phase in the milestone
|
||||
|
||||
Read `.ci/config.json` for autonomy level.
|
||||
Read `.ciagent/config.json` for autonomy level.
|
||||
|
||||
**Validation gates — all must pass before proceeding:**
|
||||
|
||||
1. **Milestone type resolved** — `getMilestoneType()` must return `"nfr" | "feature" | "major"`. Stop if undefined.
|
||||
2. **Branch hierarchy correct** — phase branch exists and targets the correct parent (milestone branch, or main if no milestone branch exists).
|
||||
3. **No unmerged phase branches** — if shipping a milestone, all phase branches for this milestone must be merged into the milestone branch.
|
||||
4. **Tag sequence valid** — the computed tag must be strictly greater than all existing tags on the same major.minor line. Check with `git tag -l`.
|
||||
5. **Autonomy confirmed** — `.ciagent/config.json` autonomy level must be `full`. This is the zero-HITL enforcement point.
|
||||
|
||||
If any validation fails: stop and report. Do NOT proceed past a failed gate.
|
||||
|
||||
## Step 2: Run Tests
|
||||
|
||||
@@ -55,24 +90,97 @@ npm run build
|
||||
|
||||
If any fail: iterate autonomously until tests pass. Do NOT ask the user for guidance — debug and fix.
|
||||
|
||||
## Step 3: Compute Version
|
||||
## Step 3: Create PR and Quality Assurance
|
||||
|
||||
Determine the release version from what is being shipped. Check `isNfrMilestone()` for versioning behavior:
|
||||
**Open a Pull Request for the merge target:**
|
||||
|
||||
| What's shipping | Milestone Type | Version bump | Tag format | Example |
|
||||
|----------------|---------------|-------------|------------|---------|
|
||||
| Single phase | NFR | Patch | `vX.Y.Z` | `v0.1.3` (3rd NFR phase in milestone v0.1) |
|
||||
| Single phase | Feature | Patch | `vX.Y.Z` | `v0.2.3` (3rd phase in feature milestone v0.2) |
|
||||
| Milestone completion | NFR | Patch (last phase) | `vX.Y.Z` | `v0.1.3` (no minor tag) |
|
||||
| Milestone completion | Feature | Minor | `vX.Y.0` | `v0.3.0` (feature milestone v0.3 complete) |
|
||||
| Project refactor/schema change | Any | Major | `vX.0.0` | `v1.0.0` (breaking schema) |
|
||||
```bash
|
||||
tea pr create --base <target-branch> --head <source-branch> --title "ship: [phase-name or milestone-name]"
|
||||
```
|
||||
|
||||
Count completed phases in the current milestone to determine the patch number.
|
||||
- For a phase ship: PR from `phase/NN-slug` into `milestone/vX.Y-slug` (or `main` if no milestone branch).
|
||||
- For a milestone ship: PR from `milestone/vX.Y-slug` into `main`.
|
||||
|
||||
## Step 4: Merge Branch
|
||||
**Auto-merge configuration:**
|
||||
|
||||
### Phase ship (patch release)
|
||||
Set the PR to auto-merge upon pipeline success:
|
||||
|
||||
```bash
|
||||
tea pr merge <pr-number> --auto --squash
|
||||
```
|
||||
|
||||
**Review:**
|
||||
|
||||
Conduct a thorough autonomous review of the PR diff. Check:
|
||||
- All expected files are included
|
||||
- No unintended changes slipped in
|
||||
- No secrets or credentials in the diff
|
||||
- All `---ci---` blocks have correct metadata
|
||||
|
||||
**Finalization:**
|
||||
|
||||
- **On pipeline success:** the PR auto-merges. Proceed to Step 4.
|
||||
- **On pipeline failure:** iterate autonomously until the pipeline passes. Do NOT merge a PR with a failing pipeline. Do NOT ask for guidance.
|
||||
|
||||
**Strict rule:** Never merge a PR with a failed pipeline. No exceptions.
|
||||
|
||||
## Step 4: Compute Version
|
||||
|
||||
| What's shipping | Milestone Type | Phase release | Milestone release | Example |
|
||||
|----------------|---------------|---------------|-------------------|---------|
|
||||
| Single phase | NFR | Patch `vX.Y.Z` | N/A | v0.1.3 (3rd NFR phase) |
|
||||
| Single phase | Feature | Patch `vX.Y.Z` | N/A | v0.2.3 (3rd feature phase) |
|
||||
| Single phase | Major | Minor `vX.(Y+N).0` | N/A | v0.4.0 (2nd major phase) |
|
||||
| Milestone completion | NFR | Patch (last phase) | None | v0.1.3 (no milestone tag) |
|
||||
| Milestone completion | Feature | Last patch | Minor `vX.(Y+1).0` | v0.3.0 (NOT v0.2.0) |
|
||||
| Milestone completion | Major | Last minor | Major `v(X+1).0.0` | v1.0.0 |
|
||||
|
||||
Phase number within the milestone determines the increment:
|
||||
- NFR/Feature: 1st phase = .1, 2nd = .2, etc. (v0.5.1, v0.5.2)
|
||||
- Major: 1st phase = next minor, 2nd = minor+1, etc. (v0.3.0, v0.4.0)
|
||||
|
||||
**Tag validation (before creating ANY tag):**
|
||||
1. Tag must be strictly greater than all existing tags on the same major.minor line
|
||||
2. Milestone completion tag must be next minor (feature) or next major (major)
|
||||
3. NEVER create a milestone tag that is semantically below existing phase tags (e.g., v0.5.0 when v0.5.1 already exists)
|
||||
|
||||
## Step 5: Merge Branch
|
||||
|
||||
### Branch hierarchy: main > milestone/vX.X-slug > phase/NN-slug
|
||||
|
||||
### Merge validation gates
|
||||
|
||||
**Phase → Milestone:**
|
||||
- VALIDATED — must target milestone branch when one exists
|
||||
- REJECTED if milestone branch does not exist for this phase's milestone
|
||||
|
||||
**Phase → Main:**
|
||||
- VALIDATED — only allowed when NO milestone branch exists for this phase's milestone
|
||||
- REJECTED if a milestone branch exists for this milestone
|
||||
|
||||
**Milestone → Main:**
|
||||
- VALIDATED — only after all phase branches are merged
|
||||
- REJECTED if any phase branches for this milestone are unmerged
|
||||
|
||||
### Phase ship
|
||||
|
||||
**If milestone branch exists:**
|
||||
```bash
|
||||
git checkout milestone/vX.Y-slug
|
||||
git merge --squash phase/NN-slug
|
||||
git commit -m "docs(P##): complete [phase-name] phase
|
||||
|
||||
---ci---
|
||||
phase: [N]
|
||||
milestone: [vX.Y]
|
||||
status: complete
|
||||
requirements:
|
||||
covered: [REQ-01, REQ-02]
|
||||
partial: []
|
||||
---/ci---"
|
||||
```
|
||||
|
||||
**If no milestone branch exists (single-phase milestone):**
|
||||
```bash
|
||||
git checkout main
|
||||
git merge --squash phase/NN-slug
|
||||
@@ -88,7 +196,9 @@ requirements:
|
||||
---/ci---"
|
||||
```
|
||||
|
||||
### Milestone ship (minor/major release)
|
||||
### Milestone ship (after last phase)
|
||||
|
||||
**Validate all phase branches are merged into the milestone branch before proceeding.**
|
||||
|
||||
```bash
|
||||
git checkout main
|
||||
@@ -102,24 +212,30 @@ status: complete
|
||||
---/ci---"
|
||||
```
|
||||
|
||||
## Step 5: Tag and Push
|
||||
## Step 6: Tag and Push
|
||||
|
||||
```bash
|
||||
git tag -a vX.Y.Z -m "vX.Y.Z: [phase-name or milestone-name]"
|
||||
git push origin main --tags
|
||||
```
|
||||
|
||||
## Step 6: Create Release
|
||||
**Tag format by milestone type:**
|
||||
- NFR/Feature phase: patch format (`v0.5.1`, `v0.5.2`)
|
||||
- Major phase: minor format (`v0.3.0`, `v0.4.0`)
|
||||
- Feature milestone: next minor (`v0.6.0`, NOT `v0.5.0`)
|
||||
- Major milestone: next major (`v1.0.0`)
|
||||
|
||||
## Step 7: Create Release and Package
|
||||
|
||||
**Every ship creates a Gitea release. No exceptions.**
|
||||
|
||||
Generate release notes from git log:
|
||||
### Generate release notes
|
||||
|
||||
```bash
|
||||
git log v[previous_tag]..vX.Y.Z --oneline
|
||||
```
|
||||
|
||||
Create the release via Gitea API:
|
||||
### Create the Gitea release
|
||||
|
||||
```bash
|
||||
curl -X POST "https://git.cloudinit.dev/api/v1/repos/continuous-intelligence/ci/releases" \
|
||||
@@ -130,22 +246,45 @@ curl -X POST "https://git.cloudinit.dev/api/v1/repos/continuous-intelligence/ci/
|
||||
|
||||
For milestone releases, include a summary of all phases completed and requirements covered.
|
||||
|
||||
## Step 7: Update .ci/ Files
|
||||
### Create distribution packages
|
||||
|
||||
- Update `.ci/REQUIREMENTS.md` — mark shipped requirements as complete
|
||||
- Update `.ci/ROADMAP.md` — mark shipped phase as complete
|
||||
Use coreci to create the necessary distribution packages:
|
||||
|
||||
```bash
|
||||
coreci build --tag vX.Y.Z
|
||||
coreci package --tag vX.Y.Z
|
||||
```
|
||||
|
||||
Upload packages to the Gitea release:
|
||||
|
||||
```bash
|
||||
coreci release upload --tag vX.Y.Z --files [built-artifacts]
|
||||
```
|
||||
|
||||
### Generate documentation
|
||||
|
||||
Include release notes in the Gitea release body with:
|
||||
- Summary of changes
|
||||
- Requirements covered
|
||||
- Known issues (if any)
|
||||
- Migration notes (for major milestones)
|
||||
|
||||
## Step 8: Update .ci/ Files
|
||||
|
||||
- Update `.ciagent/REQUIREMENTS.md` — mark shipped requirements as complete
|
||||
- Update `.ciagent/ROADMAP.md` — mark shipped phase as complete
|
||||
|
||||
Commit the file updates.
|
||||
|
||||
## Step 8: Report
|
||||
## Step 9: Report
|
||||
|
||||
```
|
||||
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
|
||||
CI ► SHIPPED
|
||||
CIAgent ► SHIPPED
|
||||
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
|
||||
|
||||
Phase [N]: [name]
|
||||
Milestone: [vX.Y]
|
||||
Milestone: [vX.Y] ([nfr|feature|major])
|
||||
Version: vX.Y.Z
|
||||
Release: https://git.cloudinit.dev/continuous-intelligence/ci/releases/tag/vX.Y.Z
|
||||
Status: complete
|
||||
@@ -153,11 +292,12 @@ Status: complete
|
||||
Tests: PASS
|
||||
Typecheck: PASS
|
||||
Build: PASS
|
||||
Pipeline: PASS
|
||||
|
||||
Requirements covered: [N]
|
||||
Commits: [N]
|
||||
|
||||
[If milestone complete:]
|
||||
All phases in milestone v0.2 complete. Milestone released.
|
||||
All phases in milestone v0.2 complete. Milestone released as vX.Y.Z.
|
||||
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
|
||||
```
|
||||
@@ -1,18 +1,18 @@
|
||||
---
|
||||
description: Show CI project status — current phase, milestone, pipeline stage, decisions, escalations, and requirements coverage
|
||||
description: Show CIAgent project status — current phase, milestone, pipeline stage, decisions, escalations, and requirements coverage
|
||||
---
|
||||
|
||||
# CI Status
|
||||
# CIAgent Status
|
||||
|
||||
Display the current CI project status derived entirely from the git log and .ci/ files.
|
||||
Display the current CIAgent project status derived entirely from the git log and .ciagent/ files.
|
||||
|
||||
**Usage:** `ci-status`
|
||||
**Usage:** `ciagent-status`
|
||||
|
||||
## Step 0: Confirm Active Project
|
||||
|
||||
Check `ci listProjects()` or read `.ci/config.json` to determine if multi-project mode is active.
|
||||
Check `ci listProjects()` or read `.ciagent/config.json` to determine if multi-project mode is active.
|
||||
|
||||
If `.ci/config.json` has `projects[]` with length > 0:
|
||||
If `.ciagent/config.json` has `projects[]` with length > 0:
|
||||
- Show project list with active project indicator
|
||||
- Confirm `active_project` is the project to show status for
|
||||
- If not, set it with `ci setActiveProject(<slug>)`
|
||||
@@ -45,15 +45,15 @@ Collect from git log:
|
||||
## Step 3: Read .ci/ Files
|
||||
|
||||
Read:
|
||||
- `.ci/PROJECT.md` — project name and vision
|
||||
- `.ci/ROADMAP.md` — phase list with status
|
||||
- `.ci/config.json` — autonomy level
|
||||
- `.ciagent/PROJECT.md` — project name and vision
|
||||
- `.ciagent/ROADMAP.md` — phase list with status
|
||||
- `.ciagent/config.json` — autonomy level
|
||||
|
||||
## Step 4: Display Status
|
||||
|
||||
```
|
||||
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
|
||||
CI ► STATUS
|
||||
CIAgent ► STATUS
|
||||
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
|
||||
|
||||
Project: [name] [If multi-project: (active)]
|
||||
@@ -79,4 +79,4 @@ Recent commits:
|
||||
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
|
||||
```
|
||||
|
||||
If no `.ci/` directory exists: report "Project not initialized. Run ci-init first."
|
||||
If no `.ciagent/` directory exists: report "Project not initialized. Run ciagent-init first."
|
||||
@@ -1,20 +1,20 @@
|
||||
---
|
||||
description: Verify CI project deliverables against requirements — structural, behavioral, security, and quality checks
|
||||
description: Verify CIAgent project deliverables against requirements — structural, behavioral, security, and quality checks
|
||||
---
|
||||
|
||||
# CI Verify
|
||||
# CIAgent Verify
|
||||
|
||||
Run the CI verification pipeline against the current or specified phase. Four layers: structural, behavioral, security, quality.
|
||||
Run the CIAgent verification pipeline against the current or specified phase. Four layers: structural, behavioral, security, quality.
|
||||
|
||||
**Usage:** `ci-verify [phase_number]`
|
||||
**Usage:** `ciagent-verify [phase_number]`
|
||||
|
||||
If no phase specified, verifies the current phase.
|
||||
|
||||
## Step 0: Confirm Active Project
|
||||
|
||||
Check `ci listProjects()` or read `.ci/config.json` to determine if multi-project mode is active.
|
||||
Check `ci listProjects()` or read `.ciagent/config.json` to determine if multi-project mode is active.
|
||||
|
||||
If `.ci/config.json` has `projects[]` with length > 0:
|
||||
If `.ciagent/config.json` has `projects[]` with length > 0:
|
||||
- Confirm `active_project` is correct for this verification
|
||||
- If not, set it with `ci setActiveProject(<slug>)`
|
||||
- Scope verification to the active project
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Audit CI project health — reconstruct state from git log, verify .ci/ files match codebase, check for stale references
|
||||
description: Audit CIAgent project health — reconstruct state from git log, verify .ciagent/ files match codebase, check for stale references
|
||||
tools:
|
||||
read: true
|
||||
bash: true
|
||||
@@ -16,6 +16,6 @@ Arguments: $ARGUMENTS
|
||||
</context>
|
||||
|
||||
<process>
|
||||
Execute the CI audit workflow end-to-end.
|
||||
Execute the CIAgent audit workflow end-to-end.
|
||||
Preserve all workflow gates, validations, checkpoints, and routing.
|
||||
</process>
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Clarify CI project ambiguities — generate questions, accept defaults at full autonomy, present at supervised/guided
|
||||
description: Clarify CIAgent project ambiguities — generate questions, accept defaults at full autonomy, present at supervised/guided
|
||||
argument-hint: "[phase_number]"
|
||||
tools:
|
||||
read: true
|
||||
@@ -21,6 +21,6 @@ Arguments: $ARGUMENTS
|
||||
</context>
|
||||
|
||||
<process>
|
||||
Execute the CI clarify workflow end-to-end.
|
||||
Execute the CIAgent clarify workflow end-to-end.
|
||||
Preserve all workflow gates, validations, checkpoints, and routing.
|
||||
</process>
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Systematic CI debugging with git context — triage, diagnose root cause, auto-fix or escalate
|
||||
description: Systematic CIAgent debugging with git context — triage, diagnose root cause, auto-fix or escalate
|
||||
argument-hint: "[description]"
|
||||
tools:
|
||||
read: true
|
||||
@@ -21,6 +21,6 @@ Arguments: $ARGUMENTS
|
||||
</context>
|
||||
|
||||
<process>
|
||||
Execute the CI debug workflow end-to-end.
|
||||
Execute the CIAgent debug workflow end-to-end.
|
||||
Preserve all workflow gates, validations, checkpoints, and routing.
|
||||
</process>
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Initialize a new CI project — specification → clarify → create .ci/ reference files → initial commit
|
||||
description: Initialize a new CIAgent project — specification → clarify → create .ciagent/ reference files → initial commit
|
||||
argument-hint: "[description]"
|
||||
tools:
|
||||
read: true
|
||||
@@ -21,6 +21,6 @@ Arguments: $ARGUMENTS
|
||||
</context>
|
||||
|
||||
<process>
|
||||
Execute the CI init workflow end-to-end.
|
||||
Execute the CIAgent init workflow end-to-end.
|
||||
Preserve all workflow gates, validations, checkpoints, and routing.
|
||||
</process>
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Execute an ad-hoc CI task with full agentic guarantees — git context, ---ci--- commits, optional research and verification
|
||||
description: Execute an ad-hoc CIAgent task with full agentic guarantees — git context, ---ci--- commits, optional research and verification
|
||||
argument-hint: "[description] [--research] [--verify] [--full]"
|
||||
tools:
|
||||
read: true
|
||||
@@ -21,6 +21,6 @@ Arguments: $ARGUMENTS
|
||||
</context>
|
||||
|
||||
<process>
|
||||
Execute the CI quick workflow end-to-end.
|
||||
Execute the CIAgent quick workflow end-to-end.
|
||||
Preserve all workflow gates, validations, checkpoints, and routing.
|
||||
</process>
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Review CI code changes with multi-persona analysis — auto-apply P0 fixes, flag P1+ for post-hoc review
|
||||
description: Review CIAgent code changes with multi-persona analysis — auto-apply P0 fixes, flag P1+ for post-hoc review
|
||||
argument-hint: "[phase_number]"
|
||||
tools:
|
||||
read: true
|
||||
@@ -20,6 +20,6 @@ Arguments: $ARGUMENTS
|
||||
</context>
|
||||
|
||||
<process>
|
||||
Execute the CI review workflow end-to-end.
|
||||
Execute the CIAgent review workflow end-to-end.
|
||||
Preserve all workflow gates, validations, checkpoints, and routing.
|
||||
</process>
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Rollback CI phase — revert the last phase or specified phase by resetting to its pre-phase state
|
||||
description: Rollback CIAgent phase — revert the last phase or specified phase by resetting to its pre-phase state
|
||||
argument-hint: "[phase_number]"
|
||||
tools:
|
||||
read: true
|
||||
@@ -21,6 +21,6 @@ Arguments: $ARGUMENTS
|
||||
</context>
|
||||
|
||||
<process>
|
||||
Execute the CI rollback workflow end-to-end.
|
||||
Execute the CIAgent rollback workflow end-to-end.
|
||||
Preserve all workflow gates, validations, checkpoints, and routing.
|
||||
</process>
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Execute the full CI pipeline — research → plan → execute → verify → complete
|
||||
description: Execute the full CIAgent pipeline — research → plan → execute → verify → complete
|
||||
argument-hint: "[phase_number]"
|
||||
tools:
|
||||
read: true
|
||||
@@ -21,6 +21,6 @@ Arguments: $ARGUMENTS
|
||||
</context>
|
||||
|
||||
<process>
|
||||
Execute the CI run workflow end-to-end.
|
||||
Execute the CIAgent run workflow end-to-end.
|
||||
Preserve all workflow gates, validations, checkpoints, and routing.
|
||||
</process>
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Ship CI phase or milestone — test, commit, tag, push, release. Full autopilot: zero HITL after milestone setup
|
||||
description: Ship CIAgent phase or milestone — Full autopilot release: validate, test, merge, tag, push, release. Zero HITL
|
||||
argument-hint: "[phase_number|milestone]"
|
||||
tools:
|
||||
read: true
|
||||
@@ -12,7 +12,7 @@ tools:
|
||||
---
|
||||
|
||||
<execution_context>
|
||||
@__OPENCODE_DIR__/ci/workflows/ship.md
|
||||
@/root/.config/opencode/ci/workflows/ship.md
|
||||
</execution_context>
|
||||
|
||||
<context>
|
||||
@@ -20,6 +20,6 @@ Arguments: $ARGUMENTS
|
||||
</context>
|
||||
|
||||
<process>
|
||||
Execute the CI ship workflow end-to-end.
|
||||
Execute the CIAgent ship workflow end-to-end.
|
||||
Preserve all workflow gates, validations, checkpoints, and routing.
|
||||
</process>
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Show CI project status — current phase, milestone, pipeline stage, decisions, escalations, and requirements coverage
|
||||
description: Show CIAgent project status — current phase, milestone, pipeline stage, decisions, escalations, and requirements coverage
|
||||
tools:
|
||||
read: true
|
||||
bash: true
|
||||
@@ -16,6 +16,6 @@ Arguments: $ARGUMENTS
|
||||
</context>
|
||||
|
||||
<process>
|
||||
Execute the CI status workflow end-to-end.
|
||||
Execute the CIAgent status workflow end-to-end.
|
||||
Preserve all workflow gates, validations, checkpoints, and routing.
|
||||
</process>
|
||||
@@ -1,5 +1,5 @@
|
||||
---
|
||||
description: Verify CI project deliverables against requirements — structural, behavioral, security, and quality checks
|
||||
description: Verify CIAgent project deliverables against requirements — structural, behavioral, security, and quality checks
|
||||
argument-hint: "[phase_number]"
|
||||
tools:
|
||||
read: true
|
||||
@@ -20,6 +20,6 @@ Arguments: $ARGUMENTS
|
||||
</context>
|
||||
|
||||
<process>
|
||||
Execute the CI verify workflow end-to-end.
|
||||
Execute the CIAgent verify workflow end-to-end.
|
||||
Preserve all workflow gates, validations, checkpoints, and routing.
|
||||
</process>
|
||||
Generated
+5
-5
@@ -1,19 +1,19 @@
|
||||
{
|
||||
"name": "@continuous-intelligence/ci",
|
||||
"version": "0.1.0",
|
||||
"name": "@continuous-intelligence/ciagent",
|
||||
"version": "0.10.0",
|
||||
"lockfileVersion": 3,
|
||||
"requires": true,
|
||||
"packages": {
|
||||
"": {
|
||||
"name": "@continuous-intelligence/ci",
|
||||
"version": "0.1.0",
|
||||
"name": "@continuous-intelligence/ciagent",
|
||||
"version": "0.10.0",
|
||||
"license": "MIT",
|
||||
"dependencies": {
|
||||
"commander": "^12.1.0",
|
||||
"zod": "^3.23.0"
|
||||
},
|
||||
"bin": {
|
||||
"ci": "dist/cli/index.js"
|
||||
"ciagent": "dist/cli/index.js"
|
||||
},
|
||||
"devDependencies": {
|
||||
"@types/jest": "^29.5.0",
|
||||
|
||||
+20
-5
@@ -1,11 +1,11 @@
|
||||
{
|
||||
"name": "@continuous-intelligence/ci",
|
||||
"version": "0.5.0",
|
||||
"name": "@continuous-intelligence/ciagent",
|
||||
"version": "0.10.0",
|
||||
"description": "Fully autonomous AI-driven software engineering harness - Continuous Intelligence",
|
||||
"main": "dist/index.js",
|
||||
"types": "dist/index.d.ts",
|
||||
"bin": {
|
||||
"ci": "./dist/cli/index.js"
|
||||
"ciagent": "./dist/cli/index.js"
|
||||
},
|
||||
"files": [
|
||||
"dist/",
|
||||
@@ -19,14 +19,29 @@
|
||||
"dev": "ts-node src/cli.ts",
|
||||
"typecheck": "tsc --noEmit",
|
||||
"test": "jest",
|
||||
"prepublishOnly": "npm run build",
|
||||
"check-version": "node scripts/check-version.js",
|
||||
"postbuild": "node scripts/ensure-shebang.js",
|
||||
"prepublishOnly": "npm run build && node scripts/ensure-shebang.js && node scripts/check-version.js && npm test",
|
||||
"validate-pack": "node scripts/validate-pack.js",
|
||||
"install-opencode": "node scripts/postinstall.js"
|
||||
},
|
||||
"keywords": ["ci", "autonomous", "ai", "software-engineering", "agent", "multi-project"],
|
||||
"keywords": ["ciagent", "autonomous", "ai", "software-engineering", "agent", "multi-project"],
|
||||
"license": "MIT",
|
||||
"engines": {
|
||||
"node": ">=18.0.0"
|
||||
},
|
||||
"publishConfig": {
|
||||
"registry": "https://registry.npmjs.org/",
|
||||
"access": "public"
|
||||
},
|
||||
"repository": {
|
||||
"type": "git",
|
||||
"url": "https://git.cloudinit.dev/continuous-intelligence/ciagent.git"
|
||||
},
|
||||
"homepage": "https://git.cloudinit.dev/continuous-intelligence/ciagent",
|
||||
"bugs": {
|
||||
"url": "https://git.cloudinit.dev/continuous-intelligence/ciagent/issues"
|
||||
},
|
||||
"dependencies": {
|
||||
"commander": "^12.1.0",
|
||||
"zod": "^3.23.0"
|
||||
|
||||
@@ -0,0 +1,27 @@
|
||||
const fs = require("node:fs");
|
||||
const path = require("node:path");
|
||||
|
||||
const projectRoot = path.resolve(__dirname, "..");
|
||||
|
||||
const pkgPath = path.join(projectRoot, "package.json");
|
||||
const pkg = JSON.parse(fs.readFileSync(pkgPath, "utf-8"));
|
||||
const pkgVersion = pkg.version;
|
||||
|
||||
const versionPath = path.join(projectRoot, "src", "version.ts");
|
||||
const versionContent = fs.readFileSync(versionPath, "utf-8");
|
||||
const match = versionContent.match(/VERSION\s*=\s*"([^"]+)"/);
|
||||
|
||||
if (!match) {
|
||||
console.error(`Error: Could not extract VERSION from src/version.ts`);
|
||||
process.exit(1);
|
||||
}
|
||||
|
||||
const srcVersion = match[1];
|
||||
|
||||
if (pkgVersion !== srcVersion) {
|
||||
console.error(`Error: Version mismatch — package.json=${pkgVersion}, src/version.ts=${srcVersion}`);
|
||||
process.exit(1);
|
||||
}
|
||||
|
||||
console.log(`Version consistency check passed: ${pkgVersion}`);
|
||||
process.exit(0);
|
||||
@@ -0,0 +1,23 @@
|
||||
const fs = require("node:fs");
|
||||
const path = require("node:path");
|
||||
|
||||
const projectRoot = path.resolve(__dirname, "..");
|
||||
const cliEntry = path.join(projectRoot, "dist", "cli", "index.js");
|
||||
const shebang = "#!/usr/bin/env node\n";
|
||||
|
||||
if (!fs.existsSync(cliEntry)) {
|
||||
console.log(`dist/cli/index.js not found — skipping shebang check (build may not have run yet)`);
|
||||
process.exit(0);
|
||||
}
|
||||
|
||||
const content = fs.readFileSync(cliEntry, "utf-8");
|
||||
|
||||
if (content.startsWith(shebang.trim())) {
|
||||
console.log("Shebang already present in dist/cli/index.js");
|
||||
process.exit(0);
|
||||
}
|
||||
|
||||
const updated = shebang + content;
|
||||
fs.writeFileSync(cliEntry, updated, "utf-8");
|
||||
console.log("Prepended shebang to dist/cli/index.js");
|
||||
process.exit(0);
|
||||
Regular → Executable
+15
-15
@@ -14,9 +14,9 @@ for arg in "$@"; do
|
||||
--help|-h)
|
||||
echo "Usage: $(basename "$0") [--uninstall] [--force]"
|
||||
echo ""
|
||||
echo "Install CI opencode integration files to ~/.config/opencode/"
|
||||
echo "Install CIAgent opencode integration files to ~/.config/opencode/"
|
||||
echo ""
|
||||
echo " --uninstall Remove CI integration files"
|
||||
echo " --uninstall Remove CIAgent integration files"
|
||||
echo " --force Overwrite existing files without prompting"
|
||||
echo " --help Show this help"
|
||||
exit 0
|
||||
@@ -25,24 +25,24 @@ for arg in "$@"; do
|
||||
done
|
||||
|
||||
if [ "$UNINSTALL" = true ]; then
|
||||
echo "Uninstalling CI opencode integration..."
|
||||
|
||||
rm -f "${OPENCODE_DIR}/agents/ci-"*.md 2>/dev/null || true
|
||||
rm -f "${OPENCODE_DIR}/command/ci-"*.md 2>/dev/null || true
|
||||
rm -rf "${OPENCODE_DIR}/ci/" 2>/dev/null || true
|
||||
|
||||
echo "CI integration files removed."
|
||||
echo "Uninstalling CIAgent opencode integration..."
|
||||
|
||||
rm -f "${OPENCODE_DIR}/agents/ci-"*.md 2>/dev/null || true
|
||||
rm -f "${OPENCODE_DIR}/command/ci-"*.md 2>/dev/null || true
|
||||
rm -rf "${OPENCODE_DIR}/ci/" 2>/dev/null || true
|
||||
|
||||
echo "CIAgent integration files removed."
|
||||
echo "Note: opencode.json permissions entry preserved (edit manually if needed)."
|
||||
exit 0
|
||||
fi
|
||||
|
||||
if [ ! -d "$CI_DIR" ]; then
|
||||
echo "Error: opencode/ directory not found at ${CI_DIR}"
|
||||
echo "Ensure you're running from the CI repository root."
|
||||
echo "Ensure you're running from the CIAgent repository root."
|
||||
exit 1
|
||||
fi
|
||||
|
||||
echo "Installing CI opencode integration..."
|
||||
echo "Installing CIAgent opencode integration..."
|
||||
echo " Source: ${CI_DIR}"
|
||||
echo " Target: ${OPENCODE_DIR}"
|
||||
echo ""
|
||||
@@ -143,15 +143,15 @@ fi
|
||||
|
||||
echo ""
|
||||
echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
|
||||
echo " CI ► INSTALL COMPLETE"
|
||||
echo " CIAgent ► INSTALL COMPLETE"
|
||||
echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
|
||||
echo ""
|
||||
echo " Copied: ${COPIED} files"
|
||||
echo " Skipped: ${SKIPPED} files"
|
||||
echo ""
|
||||
echo " Commands available: ci-init, ci-run, ci-quick, ci-status,"
|
||||
echo " ci-audit, ci-verify, ci-debug, ci-review, ci-ship,"
|
||||
echo " ci-rollback, ci-clarify"
|
||||
echo " Commands available: ciagent-init, ciagent-run, ciagent-quick, ciagent-status,"
|
||||
echo " ciagent-audit, ciagent-verify, ciagent-debug, ciagent-review, ciagent-ship,"
|
||||
echo " ciagent-rollback, ciagent-clarify"
|
||||
echo ""
|
||||
echo " Run --uninstall to remove."
|
||||
echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
|
||||
@@ -52,19 +52,19 @@ function applyTemplate(content, vars) {
|
||||
function install() {
|
||||
const pkgDir = getPackageDir();
|
||||
if (!pkgDir) {
|
||||
console.log("CI postinstall: Could not determine package directory. Skipping.");
|
||||
console.log("CIAgent postinstall: Could not determine package directory. Skipping.");
|
||||
return;
|
||||
}
|
||||
|
||||
const opencodeDir = path.join(pkgDir, "opencode");
|
||||
if (!fs.existsSync(opencodeDir)) {
|
||||
console.log("CI postinstall: opencode/ directory not found. Skipping.");
|
||||
console.log("CIAgent postinstall: opencode/ directory not found. Skipping.");
|
||||
return;
|
||||
}
|
||||
|
||||
if (!isGlobalInstall()) {
|
||||
console.log("CI postinstall: Not a global install. Skipping opencode integration.");
|
||||
console.log(" Run `npx ci-install` or `./scripts/install.sh` to install manually.");
|
||||
console.log("CIAgent postinstall: Not a global install. Skipping opencode integration.");
|
||||
console.log(" Run `npx ciagent-install` or `./scripts/install.sh` to install manually.");
|
||||
return;
|
||||
}
|
||||
|
||||
@@ -132,11 +132,11 @@ function install() {
|
||||
}
|
||||
}
|
||||
|
||||
console.log(`CI postinstall: ${copied} files installed, ${skipped} skipped.`);
|
||||
console.log(`CIAgent postinstall: ${copied} files installed, ${skipped} skipped.`);
|
||||
}
|
||||
|
||||
try {
|
||||
install();
|
||||
} catch (err) {
|
||||
console.log("CI postinstall: Non-fatal error:", err.message);
|
||||
console.log("CIAgent postinstall: Non-fatal error:", err.message);
|
||||
}
|
||||
@@ -0,0 +1,55 @@
|
||||
const { execSync } = require("child_process");
|
||||
|
||||
const ALLOWED_ENTRIES = ["dist/", "opencode/", "templates/", "LICENSE", "README.md", "package.json"];
|
||||
|
||||
function validatePack() {
|
||||
let output;
|
||||
try {
|
||||
output = execSync("npm pack --dry-run --json", { encoding: "utf-8" });
|
||||
} catch (err) {
|
||||
console.error("Failed to run npm pack --dry-run:", err.message);
|
||||
process.exit(1);
|
||||
}
|
||||
|
||||
let packFiles;
|
||||
try {
|
||||
const parsed = JSON.parse(output);
|
||||
packFiles = Array.isArray(parsed) ? parsed[0].files : parsed.files;
|
||||
} catch (err) {
|
||||
console.error("Failed to parse npm pack output:", err.message);
|
||||
process.exit(1);
|
||||
}
|
||||
|
||||
if (!packFiles || !Array.isArray(packFiles)) {
|
||||
console.error("No files array found in npm pack output");
|
||||
process.exit(1);
|
||||
}
|
||||
|
||||
const paths = packFiles.map((f) => f.path || f);
|
||||
|
||||
const unexpected = [];
|
||||
for (const p of paths) {
|
||||
const top = p.split("/")[0] || p;
|
||||
const allowed = ALLOWED_ENTRIES.some((entry) => {
|
||||
const e = entry.replace(/\/$/, "");
|
||||
return top === e || top === entry || p === entry;
|
||||
});
|
||||
if (!allowed) {
|
||||
unexpected.push(p);
|
||||
}
|
||||
}
|
||||
|
||||
if (unexpected.length > 0) {
|
||||
console.error("Unexpected files in npm pack output:");
|
||||
for (const f of unexpected) {
|
||||
console.error(` - ${f}`);
|
||||
}
|
||||
console.error("");
|
||||
console.error("Allowed top-level entries:", ALLOWED_ENTRIES.join(", "));
|
||||
process.exit(1);
|
||||
}
|
||||
|
||||
console.log("npm pack validation passed — all entries are allowed.");
|
||||
}
|
||||
|
||||
validatePack();
|
||||
@@ -0,0 +1,152 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { AgentContext, AgentResult } from "./base.js";
|
||||
import { PlannerAgent } from "./planner.js";
|
||||
import { ExecutorAgent } from "./executor.js";
|
||||
import { VerifierAgent } from "./verifier.js";
|
||||
import { ResearcherAgent } from "./researcher.js";
|
||||
import { ChallengerAgent } from "./challenger.js";
|
||||
import { SecurityAuditorAgent } from "./security-auditor.js";
|
||||
import { DebuggerAgent } from "./debugger.js";
|
||||
import { DocWriterAgent } from "./doc-writer.js";
|
||||
import { DocVerifierAgent } from "./doc-verifier.js";
|
||||
import { CodeReviewerAgent } from "./code-reviewer.js";
|
||||
import { IdeationAgent } from "./ideation-agent.js";
|
||||
import { RoadmapperAgent } from "./roadmapper.js";
|
||||
import { PlanCheckerAgent } from "./plan-checker.js";
|
||||
import { ProjectResearcherAgent } from "./project-researcher.js";
|
||||
import { ResearchSynthesizerAgent } from "./research-synthesizer.js";
|
||||
import { SolutionWriterAgent } from "./solution-writer.js";
|
||||
import { PhaseResearcherAgent } from "./phase-researcher.js";
|
||||
import { TesterAgent } from "./tester.js";
|
||||
|
||||
const NON_ORCHESTRATOR_AGENTS: Array<{ name: string; factory: () => { execute(ctx: AgentContext): Promise<AgentResult>; name: string } }> = [
|
||||
{ name: "planner", factory: () => new PlannerAgent() },
|
||||
{ name: "executor", factory: () => new ExecutorAgent() },
|
||||
{ name: "verifier", factory: () => new VerifierAgent() },
|
||||
{ name: "researcher", factory: () => new ResearcherAgent() },
|
||||
{ name: "challenger", factory: () => new ChallengerAgent() },
|
||||
{ name: "security-auditor", factory: () => new SecurityAuditorAgent() },
|
||||
{ name: "debugger", factory: () => new DebuggerAgent() },
|
||||
{ name: "doc-writer", factory: () => new DocWriterAgent() },
|
||||
{ name: "doc-verifier", factory: () => new DocVerifierAgent() },
|
||||
{ name: "code-reviewer", factory: () => new CodeReviewerAgent() },
|
||||
{ name: "ideation-agent", factory: () => new IdeationAgent() },
|
||||
{ name: "roadmapper", factory: () => new RoadmapperAgent() },
|
||||
{ name: "plan-checker", factory: () => new PlanCheckerAgent() },
|
||||
{ name: "project-researcher", factory: () => new ProjectResearcherAgent() },
|
||||
{ name: "research-synthesizer", factory: () => new ResearchSynthesizerAgent() },
|
||||
{ name: "solution-writer", factory: () => new SolutionWriterAgent() },
|
||||
{ name: "phase-researcher", factory: () => new PhaseResearcherAgent() },
|
||||
{ name: "tester", factory: () => new TesterAgent() },
|
||||
];
|
||||
|
||||
describe("All agents have intrinsic mechanical logic", () => {
|
||||
let tempDir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
tempDir = fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-mechanical-test-"));
|
||||
fs.mkdirSync(path.join(tempDir, ".ciagent"), { recursive: true });
|
||||
fs.mkdirSync(path.join(tempDir, "src"), { recursive: true });
|
||||
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, ".ciagent", "config.json"),
|
||||
JSON.stringify({
|
||||
autonomy: { level: "full", escalation_hooks: [], clarify_budget: 10, decision_confidence_threshold: 0.6, max_revision_iterations: 3, max_verification_retries: 2, escalation_timeout_ms: 300000 },
|
||||
model_profile: "quality",
|
||||
parallelization: { enabled: false, max_concurrent_agents: 5, min_plans_for_parallel: 2 },
|
||||
verification: { automated_only: true, escalate_visual: true, escalate_external_integration: true, test_first: false },
|
||||
security: { auto_accept_low_severity: true, auto_mitigate_medium_severity: true, escalate_high_severity: true },
|
||||
git: { branching_strategy: "phase", auto_commit: false, auto_push: false },
|
||||
backend: { provider: "auto", agent_backends: { opencode: { enabled: false } }, llm_backends: {} },
|
||||
}, null, 2)
|
||||
);
|
||||
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, ".ciagent", "PROJECT.md"),
|
||||
"# Project: Mechanical Test\n\n## Core Value\nValidate mechanical agent logic\n\n## Requirements\n### Active\n- REQ-01: Agent runs mechanically\n\n## Key Decisions\n\n## Constraints\n- Test only"
|
||||
);
|
||||
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, ".ciagent", "REQUIREMENTS.md"),
|
||||
"# Requirements\n\n## V1\n### Functional\n| ID | Description | Priority |\n|------|------|------|\n| REQ-01 | Agent test | high |\n\n## Traceability\n| Requirement | Phase | Status |\n|------|------|------|\n| REQ-01 | 1 | in_progress |"
|
||||
);
|
||||
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, ".ciagent", "ROADMAP.md"),
|
||||
"# Roadmap\n\n## Phases\n\n| # | Name | Description | Requirements | Depends On | Status |\n|------|------|------|------|------|------|\n| 1 | Test | Agent test phase | REQ-01 | | in_progress |"
|
||||
);
|
||||
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, ".ciagent", "ARCHITECTURE.md"),
|
||||
"# Architecture\n\n## Overview\nTest architecture\n\n## Components\n| Name | Description | Boundaries | Depends On |\n|------|------|------|------|\n| core | Core | src/core/ | | \n\n## Build Order\n1. Build core\n\n## Data Flow\nTest flow"
|
||||
);
|
||||
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, "package.json"),
|
||||
JSON.stringify({ name: "mech-test", version: "0.1.0", scripts: { test: "echo ok" } })
|
||||
);
|
||||
|
||||
fs.writeFileSync(path.join(tempDir, "tsconfig.json"), "{}");
|
||||
fs.writeFileSync(path.join(tempDir, "src", "app.ts"), "export function main() { return 1; }");
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
try {
|
||||
fs.rmSync(tempDir, { recursive: true, force: true });
|
||||
} catch {}
|
||||
});
|
||||
|
||||
it("every non-orchestrator agent produces meaningful output without backend", async () => {
|
||||
const context: AgentContext = {
|
||||
project_path: tempDir,
|
||||
phase: 1,
|
||||
stage: "plan",
|
||||
specification: "Test mechanical agent logic execution",
|
||||
config_path: path.join(tempDir, ".ciagent", "config.json"),
|
||||
};
|
||||
|
||||
expect(NON_ORCHESTRATOR_AGENTS.length).toBe(18);
|
||||
|
||||
const results: Record<string, { success: boolean; error?: string; hasStubError: boolean }> = {};
|
||||
|
||||
for (const { name, factory } of NON_ORCHESTRATOR_AGENTS) {
|
||||
const agent = factory();
|
||||
expect(agent.name).toBe(name);
|
||||
|
||||
let result: AgentResult;
|
||||
|
||||
try {
|
||||
result = await agent.execute(context);
|
||||
} catch (err) {
|
||||
result = {
|
||||
success: false,
|
||||
output: "",
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
duration_ms: 0,
|
||||
error: err instanceof Error ? err.message : String(err),
|
||||
};
|
||||
}
|
||||
|
||||
const errorText = (result.error || "").toLowerCase();
|
||||
const hasStubError =
|
||||
errorText.includes("requires an intelligence backend") ||
|
||||
errorText.includes("no intelligence backend available");
|
||||
|
||||
results[name] = {
|
||||
success: result.success,
|
||||
error: result.error,
|
||||
hasStubError,
|
||||
};
|
||||
}
|
||||
|
||||
const agentsWithStubErrors = Object.entries(results)
|
||||
.filter(([, r]) => r.hasStubError)
|
||||
.map(([name]) => name);
|
||||
|
||||
expect(agentsWithStubErrors).toEqual([]);
|
||||
});
|
||||
});
|
||||
+14
-1
@@ -1,4 +1,4 @@
|
||||
import { IntelligenceBackend, BackendRequest, BackendResult, BackendUnavailableError, emptyBackendResult } from "../backends/types.js";
|
||||
import { IntelligenceBackend, BackendRequest, BackendResult, BackendUnavailableError, emptyBackendResult, validateBackendResult } from "../backends/types.js";
|
||||
import { AgentName, AutonomyLevel } from "../types/config.js";
|
||||
|
||||
export interface AgentResult {
|
||||
@@ -18,9 +18,22 @@ export interface AgentContext {
|
||||
specification: string;
|
||||
config_path: string;
|
||||
backend?: IntelligenceBackend;
|
||||
project_slug?: string;
|
||||
}
|
||||
|
||||
export function backendResultToAgentResult(result: BackendResult): AgentResult {
|
||||
const validation = validateBackendResult(result);
|
||||
if (!validation.result) {
|
||||
return {
|
||||
success: false,
|
||||
output: "",
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
duration_ms: 0,
|
||||
error: `BackendResult validation failed: ${validation.errors.join("; ")}`,
|
||||
};
|
||||
}
|
||||
return {
|
||||
success: result.success,
|
||||
output: result.output,
|
||||
|
||||
@@ -0,0 +1,57 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { ChallengerAgent } from "../agents/challenger.js";
|
||||
|
||||
describe("ChallengerAgent", () => {
|
||||
let tempDir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
tempDir = fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-challenger-test-"));
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
fs.rmSync(tempDir, { recursive: true, force: true });
|
||||
});
|
||||
|
||||
it("returns empty for no plan", () => {
|
||||
const agent = new ChallengerAgent();
|
||||
const issues = agent.mechanicalChallenge(tempDir, "/nonexistent/plan.md");
|
||||
|
||||
expect(issues).toHaveLength(0);
|
||||
});
|
||||
|
||||
it("agent name is challenger", () => {
|
||||
const agent = new ChallengerAgent();
|
||||
expect(agent.name).toBe("challenger");
|
||||
});
|
||||
|
||||
it("detects missing must-haves in plan tasks", () => {
|
||||
const planDir = path.join(tempDir, ".opencode", "plans");
|
||||
fs.mkdirSync(planDir, { recursive: true });
|
||||
const planPath = path.join(planDir, "v0.1-plan.md");
|
||||
fs.writeFileSync(planPath, `# Plan\n\n| T-01 | 1 | |\n`);
|
||||
|
||||
const agent = new ChallengerAgent();
|
||||
const issues = agent.mechanicalChallenge(tempDir, planPath);
|
||||
|
||||
expect(issues.some((i) => i.type === "missing_must_haves")).toBe(true);
|
||||
});
|
||||
|
||||
it("validates clean plan with no issues", () => {
|
||||
const planDir = path.join(tempDir, ".opencode", "plans");
|
||||
fs.mkdirSync(planDir, { recursive: true });
|
||||
const planPath = path.join(planDir, "v0.1-plan.md");
|
||||
fs.writeFileSync(planPath, `# Plan\n\n| Task | Desc | Wave | Deps | Must-Haves | REQ-ID |\n|------|------|------|------|------------|--------|\n| T-01 | Do X | 1 | none | X works | REQ-01 |\n`);
|
||||
|
||||
const agent = new ChallengerAgent();
|
||||
const issues = agent.mechanicalChallenge(tempDir, planPath);
|
||||
|
||||
expect(issues).toHaveLength(0);
|
||||
});
|
||||
|
||||
it("detects issue descriptions contain type", () => {
|
||||
const agent = new ChallengerAgent();
|
||||
expect(agent.name).toBe("challenger");
|
||||
});
|
||||
});
|
||||
@@ -1,5 +1,13 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
|
||||
interface PlanIssue {
|
||||
type: "circular_dep" | "invalid_wave" | "missing_must_haves" | "uncovered_requirement";
|
||||
description: string;
|
||||
taskId?: string;
|
||||
}
|
||||
|
||||
export class ChallengerAgent extends BaseAgent {
|
||||
readonly name = "challenger";
|
||||
readonly description = "Stress-tests plans with binding verdicts. Only escalates when confidence < 0.60.";
|
||||
@@ -8,6 +16,7 @@ export class ChallengerAgent extends BaseAgent {
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Challenging plan...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
@@ -15,14 +24,91 @@ export class ChallengerAgent extends BaseAgent {
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const planPath = path.join(context.project_path, ".opencode", "plans", `v0.${context.phase}-plan.md`);
|
||||
const issues = this.mechanicalChallenge(context.project_path, planPath);
|
||||
const output = this.formatIssues(issues);
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Plan challenge requires an intelligence backend. Configure one with: ci init --backend",
|
||||
success: issues.length === 0,
|
||||
output,
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
escalations: issues.filter((i) => i.type === "circular_dep" || i.type === "uncovered_requirement").length,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
error: issues.length > 0 ? `${issues.length} plan issue(s) found` : undefined,
|
||||
};
|
||||
}
|
||||
|
||||
mechanicalChallenge(projectPath: string, planPath: string): PlanIssue[] {
|
||||
const issues: PlanIssue[] = [];
|
||||
|
||||
if (!fs.existsSync(planPath)) {
|
||||
const altPaths = [
|
||||
path.join(projectPath, "PLAN.md"),
|
||||
path.join(projectPath, ".opencode", "plans", "plan.md"),
|
||||
];
|
||||
const found = altPaths.find((p) => fs.existsSync(p));
|
||||
if (!found) return issues;
|
||||
return this.validatePlan(found);
|
||||
}
|
||||
|
||||
return this.validatePlan(planPath);
|
||||
}
|
||||
|
||||
private validatePlan(planPath: string): PlanIssue[] {
|
||||
const issues: PlanIssue[] = [];
|
||||
const content = fs.readFileSync(planPath, "utf-8");
|
||||
|
||||
const taskLines = content.split("\n").filter((l) => /^\|\s*\w/.test(l) && !l.includes("---") && !/^\|\s*Task/i.test(l));
|
||||
for (const line of taskLines) {
|
||||
const cols = line.split("|").map((c) => c.trim()).filter(Boolean);
|
||||
if (cols.length < 1) continue;
|
||||
|
||||
const id = cols[0];
|
||||
|
||||
const meaningfulContent = cols.filter((c) => c.length > 5 && c !== id);
|
||||
if (meaningfulContent.length === 0) {
|
||||
issues.push({
|
||||
type: "missing_must_haves",
|
||||
description: `Task ${id} has no must-haves defined`,
|
||||
taskId: id,
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
const phaseSection = content.match(/##\s+Phase[\s\S]*?(?=##\s+|$)/i);
|
||||
if (phaseSection) {
|
||||
const reqIds = [...phaseSection[0].matchAll(/([A-Z]+-[A-Z]*\d+)/g)].map((m) => m[1]);
|
||||
if (reqIds.length > 0) {
|
||||
const taskHasReq = new Set<string>();
|
||||
for (const line of taskLines) {
|
||||
for (const req of reqIds) {
|
||||
if (line.includes(req)) {
|
||||
taskHasReq.add(req);
|
||||
}
|
||||
}
|
||||
}
|
||||
for (const req of reqIds) {
|
||||
if (!taskHasReq.has(req)) {
|
||||
issues.push({
|
||||
type: "uncovered_requirement",
|
||||
description: `Requirement ${req} is not covered by any task`,
|
||||
});
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return issues;
|
||||
}
|
||||
|
||||
private formatIssues(issues: PlanIssue[]): string {
|
||||
if (issues.length === 0) return "Plan validation passed — no issues found.";
|
||||
const lines: string[] = ["Plan Issues Found:", ""];
|
||||
for (const issue of issues) {
|
||||
lines.push(`[${issue.type}]${issue.taskId ? ` Task ${issue.taskId}:` : ""} ${issue.description}`);
|
||||
}
|
||||
return lines.join("\n");
|
||||
}
|
||||
}
|
||||
+121
-4
@@ -1,5 +1,52 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
|
||||
interface ReviewFinding {
|
||||
persona: "security" | "performance" | "maintainability";
|
||||
severity: "P0" | "P1" | "P2" | "P3";
|
||||
category: string;
|
||||
file: string;
|
||||
message: string;
|
||||
}
|
||||
|
||||
const SECURITY_PATTERNS: Array<{
|
||||
pattern: RegExp;
|
||||
severity: "P0" | "P1";
|
||||
category: string;
|
||||
message: string;
|
||||
}> = [
|
||||
{ pattern: /(?:exec|execSync|spawn|spawnSync)\s*\(\s*[^'"]*[\$`]/g, severity: "P0", category: "command_injection", message: "Command execution with dynamic input" },
|
||||
{ pattern: /eval\s*\(\s*[^'"]*\$\{/g, severity: "P0", category: "code_injection", message: "eval() with dynamic content" },
|
||||
{ pattern: /(?:password|secret|api[_-]?key|token)\s*[:=]\s*['"][^'"]{3,}['"]/gi, severity: "P0", category: "credential_exposure", message: "Hardcoded credential in source" },
|
||||
{ pattern: /catch\s*\(\w*\)\s*\{\s*\}/g, severity: "P0", category: "swallowed_errors", message: "Empty catch block" },
|
||||
{ pattern: /(?:__proto__|constructor\s*\[|prototype\s*\[)/g, severity: "P0", category: "prototype_pollution", message: "Prototype chain manipulation" },
|
||||
{ pattern: /(?:md5|sha1|des|rc4)\s*\(/gi, severity: "P1", category: "weak_crypto", message: "Weak cryptographic algorithm" },
|
||||
];
|
||||
|
||||
const PERFORMANCE_PATTERNS: Array<{
|
||||
pattern: RegExp;
|
||||
severity: "P1" | "P2";
|
||||
category: string;
|
||||
message: string;
|
||||
}> = [
|
||||
{ pattern: /(?:execSync|spawnSync)\s*\(\s*['"]/g, severity: "P1", category: "sync_exec", message: "Synchronous process spawn" },
|
||||
{ pattern: /setTimeout\s*\((?![^)]*clearTimeout)/g, severity: "P2", category: "timer_leak", message: "setTimeout without clearTimeout" },
|
||||
{ pattern: /express\.json\s*\(\s*\)/g, severity: "P1", category: "no_body_limit", message: "JSON body parser without size limit" },
|
||||
];
|
||||
|
||||
const MAINTAINABILITY_PATTERNS: Array<{
|
||||
pattern: RegExp;
|
||||
severity: "P1" | "P2" | "P3";
|
||||
category: string;
|
||||
message: string;
|
||||
}> = [
|
||||
{ pattern: /(?:as\s+any\b|:\s*any\b|<any>|any\[\s*\])/g, severity: "P1", category: "type_safety", message: "Use of 'any' type" },
|
||||
{ pattern: /\bvar\s+/g, severity: "P1", category: "modern_js", message: "Use of 'var'" },
|
||||
{ pattern: /\b(?:TODO|FIXME|HACK|XXX)\b/g, severity: "P2", category: "tech_debt", message: "Technical debt marker" },
|
||||
{ pattern: /console\.(log|warn|error)\s*\(/g, severity: "P2", category: "logging", message: "Direct console.log usage" },
|
||||
];
|
||||
|
||||
export class CodeReviewerAgent extends BaseAgent {
|
||||
readonly name = "code-reviewer";
|
||||
readonly description = "Multi-persona code review. Auto-applies P0 fixes. Flags P1+ for post-hoc review.";
|
||||
@@ -8,6 +55,7 @@ export class CodeReviewerAgent extends BaseAgent {
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Running code review...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
@@ -15,14 +63,83 @@ export class CodeReviewerAgent extends BaseAgent {
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const findings = this.mechanicalReview(context.project_path);
|
||||
const p0Count = findings.filter((f) => f.severity === "P0").length;
|
||||
const output = this.formatFindings(findings);
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Code review requires an intelligence backend. Configure one with: ci init --backend",
|
||||
success: p0Count === 0,
|
||||
output,
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
escalations: p0Count,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
error: p0Count > 0 ? `${p0Count} P0 finding(s) require immediate attention` : undefined,
|
||||
};
|
||||
}
|
||||
|
||||
mechanicalReview(projectPath: string): ReviewFinding[] {
|
||||
const findings: ReviewFinding[] = [];
|
||||
const srcDir = path.join(projectPath, "src");
|
||||
|
||||
if (!fs.existsSync(srcDir)) return findings;
|
||||
|
||||
const allPatterns: Array<{
|
||||
patterns: typeof SECURITY_PATTERNS;
|
||||
persona: ReviewFinding["persona"];
|
||||
}> = [
|
||||
{ patterns: SECURITY_PATTERNS as unknown as typeof SECURITY_PATTERNS, persona: "security" },
|
||||
{ patterns: PERFORMANCE_PATTERNS as unknown as typeof SECURITY_PATTERNS, persona: "performance" },
|
||||
{ patterns: MAINTAINABILITY_PATTERNS as unknown as typeof SECURITY_PATTERNS, persona: "maintainability" },
|
||||
];
|
||||
|
||||
this.scanDirectory(srcDir, projectPath, allPatterns, findings);
|
||||
return findings;
|
||||
}
|
||||
|
||||
private scanDirectory(
|
||||
dir: string,
|
||||
projectPath: string,
|
||||
personaPatterns: Array<{ patterns: Array<{ pattern: RegExp; severity: "P0" | "P1" | "P2" | "P3"; category: string; message: string }>; persona: ReviewFinding["persona"] }>,
|
||||
findings: ReviewFinding[]
|
||||
): void {
|
||||
const entries = fs.readdirSync(dir, { withFileTypes: true });
|
||||
for (const entry of entries) {
|
||||
const fullPath = path.join(dir, entry.name);
|
||||
if (entry.isDirectory() && entry.name !== "node_modules" && entry.name !== ".git") {
|
||||
this.scanDirectory(fullPath, projectPath, personaPatterns, findings);
|
||||
} else if (
|
||||
entry.isFile() &&
|
||||
entry.name.endsWith(".ts") &&
|
||||
!entry.name.endsWith(".test.ts") &&
|
||||
!entry.name.endsWith(".d.ts")
|
||||
) {
|
||||
const content = fs.readFileSync(fullPath, "utf-8");
|
||||
for (const { patterns, persona } of personaPatterns) {
|
||||
for (const { pattern, severity, category, message } of patterns) {
|
||||
pattern.lastIndex = 0;
|
||||
if (pattern.test(content)) {
|
||||
findings.push({
|
||||
persona,
|
||||
severity: severity as ReviewFinding["severity"],
|
||||
category,
|
||||
file: path.relative(projectPath, fullPath),
|
||||
message,
|
||||
});
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
private formatFindings(findings: ReviewFinding[]): string {
|
||||
if (findings.length === 0) return "No findings — code review passed.";
|
||||
const lines: string[] = ["Code Review Findings:", ""];
|
||||
for (const f of findings) {
|
||||
lines.push(`[${f.persona}|${f.severity}] ${f.category}: ${f.message} (${f.file})`);
|
||||
}
|
||||
return lines.join("\n");
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,51 @@
|
||||
import { DebuggerAgent } from "../agents/debugger.js";
|
||||
|
||||
describe("DebuggerAgent", () => {
|
||||
it("parses standard V8 stack traces", () => {
|
||||
const agent = new DebuggerAgent();
|
||||
const trace = `Error: something broke
|
||||
at Object.doWork (src/app.ts:42:15)
|
||||
at processTicksAndRejections (node:internal/process/task_queues:95:5)`;
|
||||
|
||||
const frames = (agent as unknown as { parseStackTrace: (t: string) => Array<{ file: string; line: number; function?: string }> }).parseStackTrace(trace);
|
||||
|
||||
expect(frames.length).toBeGreaterThan(0);
|
||||
expect(frames[0].file).toContain("src/app.ts");
|
||||
expect(frames[0].line).toBe(42);
|
||||
expect(frames[0].function).toContain("doWork");
|
||||
});
|
||||
|
||||
it("parses simple file:line:column traces", () => {
|
||||
const agent = new DebuggerAgent();
|
||||
const trace = "src/utils.ts:10:5";
|
||||
|
||||
const frames = (agent as unknown as { parseStackTrace: (t: string) => Array<{ file: string; line: number }> }).parseStackTrace(trace);
|
||||
|
||||
expect(frames.length).toBeGreaterThan(0);
|
||||
expect(frames[0].file).toBe("src/utils.ts");
|
||||
expect(frames[0].line).toBe(10);
|
||||
});
|
||||
|
||||
it("returns empty for non-stack-trace input", () => {
|
||||
const agent = new DebuggerAgent();
|
||||
const frames = (agent as unknown as { parseStackTrace: (t: string) => Array<unknown> }).parseStackTrace("this is just text with no frames");
|
||||
|
||||
expect(frames).toHaveLength(0);
|
||||
});
|
||||
|
||||
it("agent name is debugger", () => {
|
||||
const agent = new DebuggerAgent();
|
||||
expect(agent.name).toBe("debugger");
|
||||
});
|
||||
|
||||
it("parses multiple stack frames", () => {
|
||||
const agent = new DebuggerAgent();
|
||||
const trace = `Error: fail
|
||||
at foo (src/a.ts:1:1)
|
||||
at bar (src/b.ts:2:2)
|
||||
at baz (src/c.ts:3:3)`;
|
||||
|
||||
const frames = (agent as unknown as { parseStackTrace: (t: string) => Array<unknown> }).parseStackTrace(trace);
|
||||
expect(frames.length).toBeGreaterThanOrEqual(3);
|
||||
});
|
||||
});
|
||||
+137
-4
@@ -1,5 +1,21 @@
|
||||
import { execSync } from "node:child_process";
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
|
||||
interface StackFrame {
|
||||
file: string;
|
||||
line: number;
|
||||
column?: number;
|
||||
function?: string;
|
||||
}
|
||||
|
||||
interface DebugResult {
|
||||
rootFile: string;
|
||||
rootLine: number;
|
||||
rootFunction?: string;
|
||||
introducingCommit?: string;
|
||||
suggestion?: string;
|
||||
}
|
||||
|
||||
export class DebuggerAgent extends BaseAgent {
|
||||
readonly name = "debugger";
|
||||
readonly description = "Autonomous debugging. Auto-fixes when root cause confidence > 0.60, escalates otherwise.";
|
||||
@@ -8,6 +24,7 @@ export class DebuggerAgent extends BaseAgent {
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Running autonomous debug...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
@@ -15,14 +32,130 @@ export class DebuggerAgent extends BaseAgent {
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const debugResult = this.mechanicalDebug(context.project_path, context.specification);
|
||||
const output = this.formatDebugResult(debugResult);
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Debugging requires an intelligence backend. Configure one with: ci init --backend",
|
||||
success: !!debugResult.introducingCommit,
|
||||
output,
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
escalations: debugResult.introducingCommit ? 0 : 1,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
error: debugResult.introducingCommit ? undefined : "Could not identify introducing commit via git bisect",
|
||||
};
|
||||
}
|
||||
|
||||
mechanicalDebug(projectPath: string, stackTrace: string): DebugResult {
|
||||
const frames = this.parseStackTrace(stackTrace);
|
||||
|
||||
if (frames.length === 0) {
|
||||
return { rootFile: "", rootLine: 0, suggestion: "No parseable stack frames found in input" };
|
||||
}
|
||||
|
||||
const topFrame = frames[0];
|
||||
const result: DebugResult = {
|
||||
rootFile: topFrame.file,
|
||||
rootLine: topFrame.line,
|
||||
rootFunction: topFrame.function,
|
||||
};
|
||||
|
||||
try {
|
||||
const bisectResult = this.gitBisect(projectPath, topFrame.file, topFrame.line);
|
||||
if (bisectResult) {
|
||||
result.introducingCommit = bisectResult;
|
||||
result.suggestion = `git revert ${bisectResult}`;
|
||||
}
|
||||
} catch {}
|
||||
|
||||
return result;
|
||||
}
|
||||
|
||||
parseStackTrace(trace: string): StackFrame[] {
|
||||
const frames: StackFrame[] = [];
|
||||
const patterns = [
|
||||
/at\s+(.+?)\s+\((.+?):(\d+):(\d+)\)/g,
|
||||
/at\s+(.+?)\s+\((.+?):(\d+)\)/g,
|
||||
/at\s+(.+?):(\d+):(\d+)/g,
|
||||
/(.+?):(\d+):(\d+)/g,
|
||||
];
|
||||
|
||||
for (const pattern of patterns) {
|
||||
let match;
|
||||
while ((match = pattern.exec(trace)) !== null) {
|
||||
if (pattern === patterns[0] || pattern === patterns[1]) {
|
||||
frames.push({
|
||||
function: match[1],
|
||||
file: match[2],
|
||||
line: parseInt(match[3]),
|
||||
column: match[4] ? parseInt(match[4]) : undefined,
|
||||
});
|
||||
} else {
|
||||
frames.push({
|
||||
file: match[1],
|
||||
line: parseInt(match[2]),
|
||||
column: match[3] ? parseInt(match[3]) : undefined,
|
||||
});
|
||||
}
|
||||
}
|
||||
if (frames.length > 0) break;
|
||||
}
|
||||
|
||||
return frames;
|
||||
}
|
||||
|
||||
private gitBisect(projectPath: string, file: string, line: number): string | null {
|
||||
try {
|
||||
execSync("git bisect start", { cwd: projectPath, stdio: "pipe", timeout: 5000 });
|
||||
execSync("git bisect bad HEAD", { cwd: projectPath, stdio: "pipe", timeout: 5000 });
|
||||
|
||||
try {
|
||||
const firstCommit = execSync("git rev-list --max-parents=0 HEAD", {
|
||||
cwd: projectPath, encoding: "utf-8", stdio: "pipe", timeout: 5000,
|
||||
}).trim();
|
||||
execSync(`git bisect good ${firstCommit}`, { cwd: projectPath, stdio: "pipe", timeout: 5000 });
|
||||
} catch {
|
||||
execSync("git bisect good HEAD~20", { cwd: projectPath, stdio: "pipe", timeout: 5000 });
|
||||
}
|
||||
|
||||
let result: string | null = null;
|
||||
for (let i = 0; i < 50; i++) {
|
||||
const output = execSync("git bisect run true", {
|
||||
cwd: projectPath, encoding: "utf-8", stdio: "pipe", timeout: 30000,
|
||||
});
|
||||
if (output.includes("is the first bad commit")) {
|
||||
const hashMatch = output.match(/^([a-f0-9]+)/m);
|
||||
result = hashMatch ? hashMatch[1] : null;
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
try {
|
||||
execSync("git bisect reset", { cwd: projectPath, stdio: "pipe", timeout: 5000 });
|
||||
} catch {}
|
||||
|
||||
return result;
|
||||
} catch {
|
||||
try {
|
||||
execSync("git bisect reset", { cwd: projectPath, stdio: "pipe", timeout: 5000 });
|
||||
} catch {}
|
||||
return null;
|
||||
}
|
||||
}
|
||||
|
||||
private formatDebugResult(result: DebugResult): string {
|
||||
const lines: string[] = ["Debug Analysis:", ""];
|
||||
if (result.rootFile) {
|
||||
lines.push(`Root location: ${result.rootFile}:${result.rootLine}`);
|
||||
if (result.rootFunction) lines.push(`Function: ${result.rootFunction}`);
|
||||
}
|
||||
if (result.introducingCommit) {
|
||||
lines.push(`Introduced by: ${result.introducingCommit}`);
|
||||
}
|
||||
if (result.suggestion) {
|
||||
lines.push(`Suggestion: ${result.suggestion}`);
|
||||
}
|
||||
return lines.join("\n");
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,167 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { DocVerifierAgent } from "../agents/doc-verifier.js";
|
||||
|
||||
function setupValidProject(tempDir: string): void {
|
||||
const srcDir = path.join(tempDir, "src");
|
||||
const agentsDir = path.join(srcDir, "agents");
|
||||
|
||||
const agentFiles = [
|
||||
"orchestrator.ts", "planner.ts", "executor.ts", "verifier.ts",
|
||||
"researcher.ts", "challenger.ts", "security-auditor.ts", "debugger.ts",
|
||||
"doc-writer.ts", "doc-verifier.ts", "code-reviewer.ts", "ideation-agent.ts",
|
||||
"roadmapper.ts", "plan-checker.ts", "project-researcher.ts",
|
||||
"research-synthesizer.ts", "solution-writer.ts", "phase-researcher.ts", "tester.ts",
|
||||
];
|
||||
|
||||
for (const dir of ["agents", "backends", "cli", "core", "types", "utils", "verification"]) {
|
||||
fs.mkdirSync(path.join(srcDir, dir), { recursive: true });
|
||||
}
|
||||
|
||||
fs.writeFileSync(path.join(agentsDir, "base.ts"), "");
|
||||
fs.writeFileSync(path.join(agentsDir, "index.ts"), "");
|
||||
for (const f of agentFiles) {
|
||||
fs.writeFileSync(path.join(agentsDir, f), "export class X {}");
|
||||
}
|
||||
|
||||
fs.writeFileSync(path.join(srcDir, "version.ts"), 'export const VERSION = "0.8.0";');
|
||||
fs.writeFileSync(path.join(tempDir, "package.json"), JSON.stringify({ version: "0.8.0" }));
|
||||
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, "AGENTS.md"),
|
||||
"19 agent implementations\n44 test suites\n"
|
||||
);
|
||||
|
||||
for (let i = 0; i < 44; i++) {
|
||||
fs.writeFileSync(path.join(srcDir, `test-${i}.test.ts`), "test('x', () => {});");
|
||||
}
|
||||
}
|
||||
|
||||
describe("DocVerifierAgent", () => {
|
||||
let tempDir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
tempDir = fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-doc-verifier-test-"));
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
fs.rmSync(tempDir, { recursive: true, force: true });
|
||||
});
|
||||
|
||||
it("valid project passes with no findings", () => {
|
||||
setupValidProject(tempDir);
|
||||
|
||||
const agent = new DocVerifierAgent();
|
||||
const findings = agent.mechanicalDocVerify(tempDir);
|
||||
|
||||
expect(findings).toHaveLength(0);
|
||||
});
|
||||
|
||||
it("detects missing agent via agent_mismatch", () => {
|
||||
const srcDir = path.join(tempDir, "src");
|
||||
const agentsDir = path.join(srcDir, "agents");
|
||||
fs.mkdirSync(agentsDir, { recursive: true });
|
||||
|
||||
const agentFiles = [
|
||||
"orchestrator.ts", "planner.ts", "executor.ts", "verifier.ts",
|
||||
"researcher.ts", "challenger.ts", "security-auditor.ts",
|
||||
];
|
||||
|
||||
fs.writeFileSync(path.join(agentsDir, "base.ts"), "");
|
||||
fs.writeFileSync(path.join(agentsDir, "index.ts"), "");
|
||||
for (const f of agentFiles) {
|
||||
fs.writeFileSync(path.join(agentsDir, f), "export class X {}");
|
||||
}
|
||||
|
||||
fs.writeFileSync(path.join(srcDir, "version.ts"), 'export const VERSION = "0.8.0";');
|
||||
fs.writeFileSync(path.join(tempDir, "package.json"), JSON.stringify({ version: "0.8.0" }));
|
||||
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, "AGENTS.md"),
|
||||
"19 agent implementations\n44 test suites\n"
|
||||
);
|
||||
|
||||
const agent = new DocVerifierAgent();
|
||||
const findings = agent.mechanicalDocVerify(tempDir);
|
||||
|
||||
const mismatch = findings.find((f) => f.type === "agent_mismatch");
|
||||
expect(mismatch).toBeDefined();
|
||||
expect(mismatch!.severity).toBe("P1");
|
||||
});
|
||||
|
||||
it("detects version drift between package.json and src/version.ts", () => {
|
||||
const srcDir = path.join(tempDir, "src");
|
||||
fs.mkdirSync(srcDir, { recursive: true });
|
||||
|
||||
fs.writeFileSync(path.join(tempDir, "package.json"), JSON.stringify({ version: "0.8.0" }));
|
||||
fs.writeFileSync(path.join(srcDir, "version.ts"), 'export const VERSION = "0.9.0";');
|
||||
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, "AGENTS.md"),
|
||||
"19 agent implementations\n44 test suites\n"
|
||||
);
|
||||
|
||||
const agent = new DocVerifierAgent();
|
||||
const findings = agent.mechanicalDocVerify(tempDir);
|
||||
|
||||
const drift = findings.find((f) => f.type === "version_drift");
|
||||
expect(drift).toBeDefined();
|
||||
expect(drift!.severity).toBe("P0");
|
||||
expect(drift!.expected).toContain("0.8.0");
|
||||
expect(drift!.actual).toContain("0.9.0");
|
||||
});
|
||||
|
||||
it("detects architecture stale when expected directory missing", () => {
|
||||
const srcDir = path.join(tempDir, "src");
|
||||
const limitedDirs = ["agents", "types"];
|
||||
for (const dir of limitedDirs) {
|
||||
fs.mkdirSync(path.join(srcDir, dir), { recursive: true });
|
||||
}
|
||||
|
||||
fs.writeFileSync(path.join(srcDir, "version.ts"), 'export const VERSION = "0.8.0";');
|
||||
fs.writeFileSync(path.join(tempDir, "package.json"), JSON.stringify({ version: "0.8.0" }));
|
||||
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, "AGENTS.md"),
|
||||
"19 agent implementations\n44 test suites\n"
|
||||
);
|
||||
|
||||
const agent = new DocVerifierAgent();
|
||||
const findings = agent.mechanicalDocVerify(tempDir);
|
||||
|
||||
const stale = findings.filter((f) => f.type === "architecture_stale");
|
||||
expect(stale.length).toBeGreaterThan(0);
|
||||
expect(stale.some((f) => f.expected.includes("backends"))).toBe(true);
|
||||
});
|
||||
|
||||
it("agent name is doc-verifier", () => {
|
||||
const agent = new DocVerifierAgent();
|
||||
expect(agent.name).toBe("doc-verifier");
|
||||
});
|
||||
|
||||
it("findings include type and severity fields", () => {
|
||||
const srcDir = path.join(tempDir, "src");
|
||||
fs.mkdirSync(srcDir, { recursive: true });
|
||||
|
||||
fs.writeFileSync(path.join(tempDir, "package.json"), JSON.stringify({ version: "1.0.0" }));
|
||||
fs.writeFileSync(path.join(srcDir, "version.ts"), 'export const VERSION = "2.0.0";');
|
||||
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, "AGENTS.md"),
|
||||
"19 agent implementations\n99 test suites\n"
|
||||
);
|
||||
|
||||
const agent = new DocVerifierAgent();
|
||||
const findings = agent.mechanicalDocVerify(tempDir);
|
||||
|
||||
for (const f of findings) {
|
||||
expect(f.type).toBeDefined();
|
||||
expect(f.severity).toBeDefined();
|
||||
expect(f.expected).toBeDefined();
|
||||
expect(f.actual).toBeDefined();
|
||||
expect(["P0", "P1", "P2"]).toContain(f.severity);
|
||||
expect(["agent_mismatch", "version_drift", "architecture_stale", "test_count_drift"]).toContain(f.type);
|
||||
}
|
||||
});
|
||||
});
|
||||
+186
-4
@@ -1,13 +1,26 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
|
||||
interface DocFinding {
|
||||
type: "agent_mismatch" | "version_drift" | "architecture_stale" | "test_count_drift";
|
||||
severity: "P0" | "P1" | "P2";
|
||||
expected: string;
|
||||
actual: string;
|
||||
file?: string;
|
||||
}
|
||||
|
||||
const KNOWN_COMPONENTS = ["agents", "backends", "cli", "core", "types", "utils", "verification"];
|
||||
|
||||
export class DocVerifierAgent extends BaseAgent {
|
||||
readonly name = "doc-verifier";
|
||||
readonly description = "Verifies documentation matches live codebase.";
|
||||
readonly description = "Verifies documentation matches live codebase via mechanical cross-checks.";
|
||||
readonly workflow = "verify";
|
||||
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Verifying documentation...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
@@ -15,14 +28,183 @@ export class DocVerifierAgent extends BaseAgent {
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const findings = this.mechanicalDocVerify(context.project_path);
|
||||
const output = this.formatFindings(findings);
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Documentation verification requires an intelligence backend.",
|
||||
success: true,
|
||||
output,
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
};
|
||||
}
|
||||
|
||||
mechanicalDocVerify(projectPath: string): DocFinding[] {
|
||||
const findings: DocFinding[] = [];
|
||||
|
||||
const agentFinding = this.checkAgentRegistry(projectPath);
|
||||
if (agentFinding) findings.push(agentFinding);
|
||||
|
||||
const versionFinding = this.checkVersionConsistency(projectPath);
|
||||
if (versionFinding) findings.push(versionFinding);
|
||||
|
||||
const archFindings = this.checkArchitectureTree(projectPath);
|
||||
findings.push(...archFindings);
|
||||
|
||||
const testFinding = this.checkTestCount(projectPath);
|
||||
if (testFinding) findings.push(testFinding);
|
||||
|
||||
return findings;
|
||||
}
|
||||
|
||||
checkAgentRegistry(projectPath: string): DocFinding | null {
|
||||
const agentsDir = path.join(projectPath, "src", "agents");
|
||||
if (!fs.existsSync(agentsDir)) return null;
|
||||
|
||||
const agentFiles = fs.readdirSync(agentsDir)
|
||||
.filter((f) => f.endsWith(".ts") && !f.endsWith(".test.ts") && !f.endsWith(".d.ts") && f !== "index.ts" && f !== "base.ts");
|
||||
|
||||
const agentsMdPath = path.join(projectPath, "AGENTS.md");
|
||||
if (!fs.existsSync(agentsMdPath)) return null;
|
||||
|
||||
const agentsMdContent = fs.readFileSync(agentsMdPath, "utf-8");
|
||||
const agentCountMatch = agentsMdContent.match(/(\d+)\s+agent/i);
|
||||
|
||||
if (!agentCountMatch) return null;
|
||||
|
||||
const claimedCount = parseInt(agentCountMatch[1], 10);
|
||||
const actualCount = agentFiles.length;
|
||||
|
||||
if (actualCount !== claimedCount) {
|
||||
return {
|
||||
type: "agent_mismatch",
|
||||
severity: "P1",
|
||||
expected: `${claimedCount} agents`,
|
||||
actual: `${actualCount} agents`,
|
||||
file: "AGENTS.md",
|
||||
};
|
||||
}
|
||||
|
||||
return null;
|
||||
}
|
||||
|
||||
checkVersionConsistency(projectPath: string): DocFinding | null {
|
||||
const pkgPath = path.join(projectPath, "package.json");
|
||||
const versionPath = path.join(projectPath, "src", "version.ts");
|
||||
|
||||
if (!fs.existsSync(pkgPath) || !fs.existsSync(versionPath)) return null;
|
||||
|
||||
const pkg = JSON.parse(fs.readFileSync(pkgPath, "utf-8"));
|
||||
const pkgVersion = pkg.version;
|
||||
|
||||
const versionContent = fs.readFileSync(versionPath, "utf-8");
|
||||
const match = versionContent.match(/VERSION\s*=\s*"([^"]+)"/);
|
||||
if (!match) return null;
|
||||
|
||||
const srcVersion = match[1];
|
||||
|
||||
if (pkgVersion !== srcVersion) {
|
||||
return {
|
||||
type: "version_drift",
|
||||
severity: "P0",
|
||||
expected: `package.json=${pkgVersion}`,
|
||||
actual: `src/version.ts=${srcVersion}`,
|
||||
file: "src/version.ts",
|
||||
};
|
||||
}
|
||||
|
||||
return null;
|
||||
}
|
||||
|
||||
checkArchitectureTree(projectPath: string): DocFinding[] {
|
||||
const findings: DocFinding[] = [];
|
||||
const srcDir = path.join(projectPath, "src");
|
||||
if (!fs.existsSync(srcDir)) return findings;
|
||||
|
||||
const actualDirs = new Set(
|
||||
fs.readdirSync(srcDir, { withFileTypes: true })
|
||||
.filter((d) => d.isDirectory())
|
||||
.map((d) => d.name)
|
||||
);
|
||||
|
||||
const archMdPath = this.resolveArchMdPath(projectPath);
|
||||
const archFile = archMdPath ? path.relative(projectPath, archMdPath) : "ARCHITECTURE.md";
|
||||
|
||||
for (const expected of KNOWN_COMPONENTS) {
|
||||
if (!actualDirs.has(expected)) {
|
||||
findings.push({
|
||||
type: "architecture_stale",
|
||||
severity: "P2",
|
||||
expected: `src/${expected}/ directory`,
|
||||
actual: "directory not found",
|
||||
file: archFile,
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
return findings;
|
||||
}
|
||||
|
||||
checkTestCount(projectPath: string): DocFinding | null {
|
||||
const agentsMdPath = path.join(projectPath, "AGENTS.md");
|
||||
if (!fs.existsSync(agentsMdPath)) return null;
|
||||
|
||||
const agentsMdContent = fs.readFileSync(agentsMdPath, "utf-8");
|
||||
const testCountMatch = agentsMdContent.match(/(\d+)\s+test\s+suit/i);
|
||||
|
||||
if (!testCountMatch) return null;
|
||||
|
||||
const claimedCount = parseInt(testCountMatch[1], 10);
|
||||
const actualCount = this.countTestFiles(path.join(projectPath, "src"));
|
||||
|
||||
if (actualCount !== claimedCount) {
|
||||
return {
|
||||
type: "test_count_drift",
|
||||
severity: "P1",
|
||||
expected: `${claimedCount} test suites`,
|
||||
actual: `${actualCount} test suites`,
|
||||
file: "AGENTS.md",
|
||||
};
|
||||
}
|
||||
|
||||
return null;
|
||||
}
|
||||
|
||||
private resolveArchMdPath(projectPath: string): string | null {
|
||||
const ciagentArch = path.join(projectPath, ".ciagent", "ARCHITECTURE.md");
|
||||
if (fs.existsSync(ciagentArch)) return ciagentArch;
|
||||
|
||||
const ciArch = path.join(projectPath, ".ci", "ARCHITECTURE.md");
|
||||
if (fs.existsSync(ciArch)) return ciArch;
|
||||
|
||||
return null;
|
||||
}
|
||||
|
||||
private countTestFiles(dir: string): number {
|
||||
if (!fs.existsSync(dir)) return 0;
|
||||
|
||||
let count = 0;
|
||||
const entries = fs.readdirSync(dir, { withFileTypes: true });
|
||||
for (const entry of entries) {
|
||||
const fullPath = path.join(dir, entry.name);
|
||||
if (entry.isDirectory() && entry.name !== "node_modules" && entry.name !== ".git") {
|
||||
count += this.countTestFiles(fullPath);
|
||||
} else if (entry.isFile() && entry.name.endsWith(".test.ts")) {
|
||||
count++;
|
||||
}
|
||||
}
|
||||
return count;
|
||||
}
|
||||
|
||||
private formatFindings(findings: DocFinding[]): string {
|
||||
if (findings.length === 0) return "Documentation verification passed — no drift detected.";
|
||||
const lines: string[] = ["Documentation Findings:", ""];
|
||||
for (const f of findings) {
|
||||
lines.push(`[${f.type}|${f.severity}] expected: ${f.expected}, actual: ${f.actual}${f.file ? ` (${f.file})` : ""}`);
|
||||
}
|
||||
return lines.join("\n");
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,65 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { DocWriterAgent } from "../agents/doc-writer.js";
|
||||
|
||||
describe("DocWriterAgent", () => {
|
||||
let tempDir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
tempDir = fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-doc-writer-test-"));
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
fs.rmSync(tempDir, { recursive: true, force: true });
|
||||
});
|
||||
|
||||
it("updates ROADMAP.md phase status to complete", () => {
|
||||
const ciDir = path.join(tempDir, ".ciagent");
|
||||
fs.mkdirSync(ciDir, { recursive: true });
|
||||
fs.writeFileSync(path.join(ciDir, "ROADMAP.md"), "# Roadmap\n\n| 1 | Setup | in progress | scaffold |\n");
|
||||
|
||||
const agent = new DocWriterAgent();
|
||||
const updates = agent.mechanicalDocUpdate(tempDir, 1);
|
||||
|
||||
const roadmapContent = fs.readFileSync(path.join(ciDir, "ROADMAP.md"), "utf-8");
|
||||
expect(roadmapContent).toContain("complete");
|
||||
});
|
||||
|
||||
it("returns no updates when no .ciagent dir", () => {
|
||||
const agent = new DocWriterAgent();
|
||||
const updates = agent.mechanicalDocUpdate(tempDir, 1);
|
||||
|
||||
expect(updates).toHaveLength(0);
|
||||
});
|
||||
|
||||
it("agent name is doc-writer", () => {
|
||||
const agent = new DocWriterAgent();
|
||||
expect(agent.name).toBe("doc-writer");
|
||||
});
|
||||
|
||||
it("updates REQUIREMENTS.md pending to covered", () => {
|
||||
const ciDir = path.join(tempDir, ".ciagent");
|
||||
fs.mkdirSync(ciDir, { recursive: true });
|
||||
fs.writeFileSync(path.join(ciDir, "REQUIREMENTS.md"),
|
||||
"# Req\n\n| REQ-01 | Do thing | P0 | 1 | pending |\n"
|
||||
);
|
||||
|
||||
const agent = new DocWriterAgent();
|
||||
const updates = agent.mechanicalDocUpdate(tempDir, 1);
|
||||
|
||||
const reqContent = fs.readFileSync(path.join(ciDir, "REQUIREMENTS.md"), "utf-8");
|
||||
expect(reqContent).toContain("covered");
|
||||
});
|
||||
|
||||
it("skips update when status already complete", () => {
|
||||
const ciDir = path.join(tempDir, ".ciagent");
|
||||
fs.mkdirSync(ciDir, { recursive: true });
|
||||
fs.writeFileSync(path.join(ciDir, "ROADMAP.md"), "# Roadmap\n\n| 1 | Setup | complete | scaffold |\n");
|
||||
|
||||
const agent = new DocWriterAgent();
|
||||
const updates = agent.mechanicalDocUpdate(tempDir, 1);
|
||||
|
||||
expect(updates).toHaveLength(0);
|
||||
});
|
||||
});
|
||||
+162
-5
@@ -1,13 +1,22 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import { execSync } from "node:child_process";
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
|
||||
interface DocUpdate {
|
||||
file: string;
|
||||
updates: string[];
|
||||
}
|
||||
|
||||
export class DocWriterAgent extends BaseAgent {
|
||||
readonly name = "doc-writer";
|
||||
readonly description = "Autonomous documentation writer. No behavioral changes from Learnship.";
|
||||
readonly description = "Autonomous documentation writer.";
|
||||
readonly workflow = "execute";
|
||||
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Writing documentation...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
@@ -15,14 +24,162 @@ export class DocWriterAgent extends BaseAgent {
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const updates = this.mechanicalDocUpdate(context.project_path, context.phase);
|
||||
const output = this.formatUpdates(updates);
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Documentation writing requires an intelligence backend.",
|
||||
artifacts_created: [],
|
||||
success: true,
|
||||
output,
|
||||
artifacts_created: updates.map((u) => u.file),
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
};
|
||||
}
|
||||
|
||||
mechanicalDocUpdate(projectPath: string, phase: number): DocUpdate[] {
|
||||
const updates: DocUpdate[] = [];
|
||||
const ciDir = path.join(projectPath, ".ciagent");
|
||||
|
||||
if (!fs.existsSync(ciDir)) return updates;
|
||||
|
||||
const roadmapUpdates = this.updateRoadmapPhaseStatus(ciDir, phase);
|
||||
if (roadmapUpdates.length > 0) {
|
||||
updates.push({ file: ".ciagent/ROADMAP.md", updates: roadmapUpdates });
|
||||
}
|
||||
|
||||
const reqUpdates = this.updateRequirementsStatus(projectPath, phase);
|
||||
if (reqUpdates.length > 0) {
|
||||
updates.push({ file: ".ciagent/REQUIREMENTS.md", updates: reqUpdates });
|
||||
}
|
||||
|
||||
const decisionUpdates = this.updateProjectDecisions(ciDir, phase);
|
||||
if (decisionUpdates.length > 0) {
|
||||
updates.push({ file: ".ciagent/PROJECT.md", updates: decisionUpdates });
|
||||
}
|
||||
|
||||
if (updates.length > 0) {
|
||||
try {
|
||||
execSync("git add -A", { cwd: projectPath, stdio: "pipe" });
|
||||
} catch {}
|
||||
}
|
||||
|
||||
return updates;
|
||||
}
|
||||
|
||||
private updateRoadmapPhaseStatus(ciDir: string, phase: number): string[] {
|
||||
const roadmapPath = path.join(ciDir, "ROADMAP.md");
|
||||
if (!fs.existsSync(roadmapPath)) return [];
|
||||
|
||||
const content = fs.readFileSync(roadmapPath, "utf-8");
|
||||
const phasePattern = new RegExp(
|
||||
`\\|\\s*${phase}\\s*\\|([^|]+)\\|([^|]+)\\|`,
|
||||
"g"
|
||||
);
|
||||
|
||||
let updated = content;
|
||||
let match;
|
||||
const updates: string[] = [];
|
||||
|
||||
while ((match = phasePattern.exec(content)) !== null) {
|
||||
const currentStatus = match[2].trim().toLowerCase();
|
||||
if (currentStatus !== "complete") {
|
||||
updated = updated.replace(
|
||||
match[0],
|
||||
match[0].replace(/in.progress|pending|not.started/i, "complete")
|
||||
);
|
||||
updates.push(`Phase ${phase}: status → complete`);
|
||||
}
|
||||
}
|
||||
|
||||
if (updated !== content) {
|
||||
fs.writeFileSync(roadmapPath, updated, "utf-8");
|
||||
}
|
||||
|
||||
return updates;
|
||||
}
|
||||
|
||||
private updateRequirementsStatus(projectPath: string, phase: number): string[] {
|
||||
const reqPath = path.join(projectPath, ".ciagent", "REQUIREMENTS.md");
|
||||
if (!fs.existsSync(reqPath)) return [];
|
||||
|
||||
const content = fs.readFileSync(reqPath, "utf-8");
|
||||
let updated = content;
|
||||
const updates: string[] = [];
|
||||
|
||||
const pendingForPhase = content.match(
|
||||
new RegExp(`\\|[^|]*\\|[^|]*\\|[^|]*\\|\\s*${phase}\\s*\\|\\s*pending\\s*\\|`, "g")
|
||||
);
|
||||
if (pendingForPhase) {
|
||||
for (const line of pendingForPhase) {
|
||||
updated = updated.replace(line, line.replace(/pending/, "covered"));
|
||||
updates.push(`Requirement updated to covered (phase ${phase})`);
|
||||
}
|
||||
}
|
||||
|
||||
if (updated !== content) {
|
||||
fs.writeFileSync(reqPath, updated, "utf-8");
|
||||
}
|
||||
|
||||
return updates;
|
||||
}
|
||||
|
||||
private updateProjectDecisions(ciDir: string, phase: number): string[] {
|
||||
const projectPath = path.join(ciDir, "PROJECT.md");
|
||||
if (!fs.existsSync(projectPath)) return [];
|
||||
|
||||
const content = fs.readFileSync(projectPath, "utf-8");
|
||||
const gitLogDecisions = this.getRecentDecisions(phase);
|
||||
|
||||
if (gitLogDecisions.length === 0) return [];
|
||||
|
||||
const updates: string[] = [];
|
||||
for (const d of gitLogDecisions) {
|
||||
if (!content.includes(d.id)) {
|
||||
updates.push(`Added decision ${d.id}: ${d.decision}`);
|
||||
}
|
||||
}
|
||||
|
||||
return updates;
|
||||
}
|
||||
|
||||
private getRecentDecisions(phase: number): Array<{ id: string; decision: string }> {
|
||||
try {
|
||||
const raw = execSync(
|
||||
`git log --all --max-count=20 --format="%B%x01"`,
|
||||
{ encoding: "utf-8", stdio: ["pipe", "pipe", "pipe"], timeout: 5000 }
|
||||
);
|
||||
const decisions: Array<{ id: string; decision: string }> = [];
|
||||
const entries = raw.split("\x01").filter(Boolean);
|
||||
|
||||
for (const entry of entries) {
|
||||
const ciMatch = entry.match(/---ci---[\s\S]*?---\/ci---/);
|
||||
if (!ciMatch) continue;
|
||||
const phaseMatch = ciMatch[0].match(/phase:\s*(\d+)/);
|
||||
if (!phaseMatch || parseInt(phaseMatch[1]) !== phase) continue;
|
||||
|
||||
const decMatches = [...ciMatch[0].matchAll(/id:\s*(D-\d+)[\s\S]*?decision:\s*(.+)/g)];
|
||||
for (const m of decMatches) {
|
||||
decisions.push({ id: m[1], decision: m[2].trim() });
|
||||
}
|
||||
}
|
||||
|
||||
return decisions;
|
||||
} catch {
|
||||
return [];
|
||||
}
|
||||
}
|
||||
|
||||
private formatUpdates(updates: DocUpdate[]): string {
|
||||
if (updates.length === 0) return "No documentation updates needed.";
|
||||
const lines: string[] = ["Documentation Updates:", ""];
|
||||
for (const u of updates) {
|
||||
lines.push(`${u.file}:`);
|
||||
for (const update of u.updates) {
|
||||
lines.push(` - ${update}`);
|
||||
}
|
||||
}
|
||||
return lines.join("\n");
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,79 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { ExecutorAgent } from "../agents/executor.js";
|
||||
import { AgentContext } from "../agents/base.js";
|
||||
import { IntelligenceBackend, BackendRequest, BackendResult } from "../backends/types.js";
|
||||
import { emptyTokenUsage } from "../backends/types.js";
|
||||
|
||||
class MockBackend implements IntelligenceBackend {
|
||||
readonly name = "mock";
|
||||
readonly type = "llm" as const;
|
||||
async isAvailable(): Promise<boolean> { return true; }
|
||||
async execute(request: BackendRequest): Promise<BackendResult> {
|
||||
return {
|
||||
success: true,
|
||||
output: `Mock backend executed: ${request.task.slice(0, 50)}`,
|
||||
artifacts: [],
|
||||
decisions: [],
|
||||
escalations: [],
|
||||
usage: emptyTokenUsage(),
|
||||
};
|
||||
}
|
||||
}
|
||||
|
||||
function createTempDir(): string {
|
||||
return fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-executor-test-"));
|
||||
}
|
||||
|
||||
function cleanup(dir: string): void {
|
||||
fs.rmSync(dir, { recursive: true, force: true });
|
||||
}
|
||||
|
||||
function makeContext(dir: string, backend?: IntelligenceBackend): AgentContext {
|
||||
return {
|
||||
project_path: dir,
|
||||
phase: 1,
|
||||
stage: "execute",
|
||||
specification: "Build a REST API for task management",
|
||||
config_path: path.join(dir, ".ciagent", "config.json"),
|
||||
backend,
|
||||
};
|
||||
}
|
||||
|
||||
describe("ExecutorAgent", () => {
|
||||
let dir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
dir = createTempDir();
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
cleanup(dir);
|
||||
});
|
||||
|
||||
it("returns honest failure without backend", async () => {
|
||||
const executor = new ExecutorAgent();
|
||||
const result = await executor.execute(makeContext(dir));
|
||||
expect(result.success).toBe(false);
|
||||
expect(result.error).toContain("intelligence backend");
|
||||
});
|
||||
|
||||
it("delegates to backend when available", async () => {
|
||||
const mockBackend = new MockBackend();
|
||||
const executor = new ExecutorAgent();
|
||||
const result = await executor.execute(makeContext(dir, mockBackend));
|
||||
expect(result.success).toBe(true);
|
||||
expect(result.output).toContain("Mock backend executed");
|
||||
});
|
||||
|
||||
it("has correct agent name", () => {
|
||||
const executor = new ExecutorAgent();
|
||||
expect(executor.name).toBe("executor");
|
||||
});
|
||||
|
||||
it("has correct workflow", () => {
|
||||
const executor = new ExecutorAgent();
|
||||
expect(executor.workflow).toBe("execute");
|
||||
});
|
||||
});
|
||||
+163
-7
@@ -1,4 +1,21 @@
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
import { execSync } from "node:child_process";
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
|
||||
export interface ExecutorResult {
|
||||
success: boolean;
|
||||
tasksExecuted: number;
|
||||
tasksCommitted: number;
|
||||
testsPassing: boolean;
|
||||
mustHavesChecked: { name: string; passed: boolean }[];
|
||||
error?: string;
|
||||
}
|
||||
|
||||
interface MustHaveItem {
|
||||
name: string;
|
||||
passed: boolean;
|
||||
}
|
||||
|
||||
export class ExecutorAgent extends BaseAgent {
|
||||
readonly name = "executor";
|
||||
@@ -8,21 +25,160 @@ export class ExecutorAgent extends BaseAgent {
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Executing tasks...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
`Execute implementation for stage ${context.stage}, phase ${context.phase}. Specification: ${context.specification}`
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
const taskPrompt = await this.buildBackendTaskPrompt(context);
|
||||
const backendResult = await this.executeViaBackend(context, taskPrompt);
|
||||
|
||||
const verification = await this.verifyExecution(context);
|
||||
|
||||
return {
|
||||
...backendResult,
|
||||
output: `${backendResult.output}\nVerification: tests=${verification.testsPassing ? "passing" : "failing"}, must-haves checked=${verification.mustHavesChecked.length}`,
|
||||
duration_ms: Date.now() - start,
|
||||
};
|
||||
}
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Execution requires an intelligence backend. Configure one with: ci init --backend",
|
||||
output: "Executor requires intelligence backend for code implementation",
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
error: "Executor requires intelligence backend for code implementation",
|
||||
};
|
||||
}
|
||||
|
||||
private async buildBackendTaskPrompt(context: AgentContext): Promise<string> {
|
||||
const parts: string[] = [
|
||||
`Execute implementation for stage ${context.stage}, phase ${context.phase}.`,
|
||||
"",
|
||||
"## Specification",
|
||||
context.specification || "No specification provided",
|
||||
];
|
||||
|
||||
const planContent = this.readPlanFile(context);
|
||||
if (planContent) {
|
||||
parts.push("", "## Plan", planContent);
|
||||
}
|
||||
|
||||
const ciDir = path.join(context.project_path, ".ciagent");
|
||||
const roadmapPath = path.join(ciDir, "ROADMAP.md");
|
||||
const archPath = path.join(ciDir, "ARCHITECTURE.md");
|
||||
|
||||
if (fs.existsSync(roadmapPath)) {
|
||||
try {
|
||||
const roadmap = fs.readFileSync(roadmapPath, "utf-8");
|
||||
parts.push("", "## Roadmap Context", roadmap.slice(0, 2000));
|
||||
} catch {}
|
||||
}
|
||||
|
||||
if (fs.existsSync(archPath)) {
|
||||
try {
|
||||
const arch = fs.readFileSync(archPath, "utf-8");
|
||||
parts.push("", "## Architecture Boundaries", arch.slice(0, 2000));
|
||||
} catch {}
|
||||
}
|
||||
|
||||
parts.push("", "## Execution Rules");
|
||||
parts.push("- Execute one task at a time");
|
||||
parts.push("- Commit after each task with ---ci--- block");
|
||||
parts.push("- Never pause for checkpoints");
|
||||
parts.push("- Create automated verification for traditionally human tasks");
|
||||
|
||||
return parts.join("\n");
|
||||
}
|
||||
|
||||
private readPlanFile(context: AgentContext): string | null {
|
||||
const planPath = path.join(context.project_path, ".ciagent", "PLAN.md");
|
||||
try {
|
||||
if (fs.existsSync(planPath)) {
|
||||
return fs.readFileSync(planPath, "utf-8");
|
||||
}
|
||||
} catch {}
|
||||
return null;
|
||||
}
|
||||
|
||||
private async verifyExecution(context: AgentContext): Promise<ExecutorResult> {
|
||||
const mustHavesChecked: MustHaveItem[] = this.checkMustHaves(context);
|
||||
let testsPassing = false;
|
||||
let tasksExecuted = 0;
|
||||
let tasksCommitted = 0;
|
||||
|
||||
try {
|
||||
const logOutput = execSync("git log --max-count=20 --oneline", {
|
||||
cwd: context.project_path,
|
||||
encoding: "utf-8",
|
||||
stdio: ["pipe", "pipe", "pipe"],
|
||||
}).trim();
|
||||
const commitLines = logOutput.split("\n").filter(Boolean);
|
||||
tasksCommitted = commitLines.filter((l) => /feat|fix|test/.test(l)).length;
|
||||
tasksExecuted = tasksCommitted;
|
||||
} catch {}
|
||||
|
||||
try {
|
||||
execSync("npm test", {
|
||||
cwd: context.project_path,
|
||||
encoding: "utf-8",
|
||||
stdio: ["pipe", "pipe", "pipe"],
|
||||
timeout: 120000,
|
||||
});
|
||||
testsPassing = true;
|
||||
} catch {
|
||||
testsPassing = false;
|
||||
}
|
||||
|
||||
return {
|
||||
success: mustHavesChecked.every((m) => m.passed) && testsPassing,
|
||||
tasksExecuted,
|
||||
tasksCommitted,
|
||||
testsPassing,
|
||||
mustHavesChecked,
|
||||
};
|
||||
}
|
||||
|
||||
private checkMustHaves(context: AgentContext): MustHaveItem[] {
|
||||
const planPath = path.join(context.project_path, ".ciagent", "PLAN.md");
|
||||
const results: MustHaveItem[] = [];
|
||||
|
||||
try {
|
||||
if (!fs.existsSync(planPath)) return results;
|
||||
const planContent = fs.readFileSync(planPath, "utf-8");
|
||||
const mustHaveRegex = /-\s*\[x\]\s*(.+)/g;
|
||||
let match;
|
||||
while ((match = mustHaveRegex.exec(planContent)) !== null) {
|
||||
const name = match[1].trim();
|
||||
const passed = this.verifyMustHaveItem(name, context);
|
||||
results.push({ name, passed });
|
||||
}
|
||||
} catch {}
|
||||
|
||||
return results;
|
||||
}
|
||||
|
||||
private verifyMustHaveItem(item: string, context: AgentContext): boolean {
|
||||
const fileMatch = item.match(/(?:exists|created?|present).*?[\s:]+([^\s]+\.(ts|js|json|md))/i);
|
||||
if (fileMatch) {
|
||||
const filePath = path.join(context.project_path, fileMatch[1]);
|
||||
return fs.existsSync(filePath);
|
||||
}
|
||||
|
||||
const testMatch = item.match(/(?:test|tests?)\s+(?:pass|passing)/i);
|
||||
if (testMatch) {
|
||||
try {
|
||||
execSync("npm test", {
|
||||
cwd: context.project_path,
|
||||
encoding: "utf-8",
|
||||
stdio: ["pipe", "pipe", "pipe"],
|
||||
timeout: 120000,
|
||||
});
|
||||
return true;
|
||||
} catch {
|
||||
return false;
|
||||
}
|
||||
}
|
||||
|
||||
return true;
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,27 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { IdeationAgent } from "../agents/ideation-agent.js";
|
||||
|
||||
describe("IdeationAgent", () => {
|
||||
it("agent name is ideation-agent", () => {
|
||||
const agent = new IdeationAgent();
|
||||
expect(agent.name).toBe("ideation-agent");
|
||||
});
|
||||
|
||||
it("workflow is research", () => {
|
||||
const agent = new IdeationAgent();
|
||||
expect(agent.workflow).toBe("research");
|
||||
});
|
||||
|
||||
it("delegates mechanicalIdeate to IdeationEngine", () => {
|
||||
const tempDir = fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-agent-test-"));
|
||||
try {
|
||||
const agent = new IdeationAgent();
|
||||
const ideas = agent.mechanicalIdeate(tempDir);
|
||||
expect(Array.isArray(ideas)).toBe(true);
|
||||
} finally {
|
||||
fs.rmSync(tempDir, { recursive: true, force: true });
|
||||
}
|
||||
});
|
||||
});
|
||||
@@ -1,13 +1,15 @@
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
import { IdeationEngine } from "../core/ideation.js";
|
||||
|
||||
export class IdeationAgent extends BaseAgent {
|
||||
readonly name = "ideation-agent";
|
||||
readonly description = "Generates improvement ideas. Output feeds directly into planning pipeline.";
|
||||
readonly description = "Generates improvement ideas using git-native pattern mining, coverage gap analysis, and architectural drift detection. Output feeds directly into planning pipeline.";
|
||||
readonly workflow = "research";
|
||||
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Generating improvement ideas...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
@@ -15,14 +17,23 @@ export class IdeationAgent extends BaseAgent {
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const engine = new IdeationEngine(context.project_path);
|
||||
const ideas = engine.runMechanical();
|
||||
const output = engine.formatIdeas(ideas);
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Ideation requires an intelligence backend.",
|
||||
success: true,
|
||||
output,
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
};
|
||||
}
|
||||
|
||||
mechanicalIdeate(projectPath: string) {
|
||||
const engine = new IdeationEngine(projectPath);
|
||||
return engine.runMechanical();
|
||||
}
|
||||
}
|
||||
+7
-4
@@ -1,9 +1,9 @@
|
||||
export { BaseAgent, AgentContext, AgentResult, backendResultToAgentResult } from "./base.js";
|
||||
export { OrchestratorAgent } from "./orchestrator.js";
|
||||
export { PlannerAgent } from "./planner.js";
|
||||
export { ExecutorAgent } from "./executor.js";
|
||||
export { VerifierAgent } from "./verifier.js";
|
||||
export { ResearcherAgent } from "./researcher.js";
|
||||
export { PlannerAgent, PlannerResult } from "./planner.js";
|
||||
export { ExecutorAgent, ExecutorResult } from "./executor.js";
|
||||
export { VerifierAgent, VerifierResult } from "./verifier.js";
|
||||
export { ResearcherAgent, ResearcherResult } from "./researcher.js";
|
||||
export { ChallengerAgent } from "./challenger.js";
|
||||
export { SecurityAuditorAgent } from "./security-auditor.js";
|
||||
export { DebuggerAgent } from "./debugger.js";
|
||||
@@ -17,6 +17,7 @@ export { ProjectResearcherAgent } from "./project-researcher.js";
|
||||
export { ResearchSynthesizerAgent } from "./research-synthesizer.js";
|
||||
export { SolutionWriterAgent } from "./solution-writer.js";
|
||||
export { PhaseResearcherAgent } from "./phase-researcher.js";
|
||||
export { TesterAgent, TesterResult } from "./tester.js";
|
||||
|
||||
import { AgentName } from "../types/config.js";
|
||||
import { BaseAgent as BaseAgentType } from "./base.js";
|
||||
@@ -38,6 +39,7 @@ import { ProjectResearcherAgent } from "./project-researcher.js";
|
||||
import { ResearchSynthesizerAgent } from "./research-synthesizer.js";
|
||||
import { SolutionWriterAgent } from "./solution-writer.js";
|
||||
import { PhaseResearcherAgent } from "./phase-researcher.js";
|
||||
import { TesterAgent } from "./tester.js";
|
||||
|
||||
const agentRegistry: Record<AgentName, () => BaseAgentType> = {
|
||||
orchestrator: () => new OrchestratorAgent(),
|
||||
@@ -58,6 +60,7 @@ const agentRegistry: Record<AgentName, () => BaseAgentType> = {
|
||||
"project-researcher": () => new ProjectResearcherAgent(),
|
||||
"research-synthesizer": () => new ResearchSynthesizerAgent(),
|
||||
"solution-writer": () => new SolutionWriterAgent(),
|
||||
tester: () => new TesterAgent(),
|
||||
};
|
||||
|
||||
export function getAgent(name: AgentName): BaseAgentType {
|
||||
|
||||
+576
-72
@@ -4,9 +4,9 @@ import { ClarifyPhase } from "../core/clarify.js";
|
||||
import { EscalationProtocol, EscalationInput } from "../core/escalation.js";
|
||||
import { GitContext, ProjectState } from "../core/git-context.js";
|
||||
import { GitBranch } from "../core/git-branch.js";
|
||||
import { CiFiles } from "../core/ci-files.js";
|
||||
import { CIAgentFiles } from "../core/ciagent-files.js";
|
||||
import { CommitBuilder } from "../core/commit-builder.js";
|
||||
import { CIConfig, AgentName } from "../types/config.js";
|
||||
import { CIAgentConfig, AgentName } from "../types/config.js";
|
||||
import {
|
||||
PipelineState,
|
||||
PipelineStage,
|
||||
@@ -16,40 +16,46 @@ import {
|
||||
STAGE_ORDER,
|
||||
} from "../types/pipeline.js";
|
||||
import { Specification, parseSpecification } from "../types/specification.js";
|
||||
import { loadConfig, saveConfig, isCIInitialized, initCI } from "../core/config.js";
|
||||
import { loadConfig, saveConfig, isCIAgentInitialized, initCIAgent } from "../core/config.js";
|
||||
import { getAgent } from "./index.js";
|
||||
import { IntelligenceBackend, BackendUnavailableError } from "../backends/types.js";
|
||||
import { registerEscalationProtocol } from "../cli/index.js";
|
||||
import { execSync } from "node:child_process";
|
||||
|
||||
export interface GitAgentContext extends AgentContext {
|
||||
gitContext: GitContext;
|
||||
gitBranch: GitBranch;
|
||||
ciFiles: CiFiles;
|
||||
ciFiles: CIAgentFiles;
|
||||
milestone: string;
|
||||
}
|
||||
|
||||
export class OrchestratorAgent extends BaseAgent {
|
||||
readonly name: AgentName = "orchestrator";
|
||||
readonly description = "Top-level autonomous controller that coordinates the full CI pipeline";
|
||||
readonly description = "Top-level autonomous controller that coordinates the full CIAgent pipeline";
|
||||
readonly workflow = "run";
|
||||
|
||||
private config: CIConfig;
|
||||
private config: CIAgentConfig;
|
||||
private pipelineState: PipelineState | null = null;
|
||||
private decisionEngine: DecisionEngine | null = null;
|
||||
private escalationProtocol: EscalationProtocol | null = null;
|
||||
private gitContext: GitContext | null = null;
|
||||
private gitBranch: GitBranch | null = null;
|
||||
private ciFiles: CiFiles | null = null;
|
||||
private ciFiles: CIAgentFiles | null = null;
|
||||
private currentMilestone: string;
|
||||
private phaseResults: PhaseResult[] = [];
|
||||
private totalPhases: number = 1;
|
||||
|
||||
private static readonly STAGE_AGENT_MAP: Partial<Record<PipelineStage, AgentName>> = {
|
||||
research: "researcher",
|
||||
plan: "planner",
|
||||
execute: "executor",
|
||||
verify: "verifier",
|
||||
private static readonly STAGE_AGENT_MAP: Partial<Record<PipelineStage, AgentName[]>> = {
|
||||
research: ["researcher"],
|
||||
ideate: ["ideation-agent"],
|
||||
plan: ["planner"],
|
||||
execute: ["executor", "code-reviewer", "security-auditor"],
|
||||
test: ["tester"],
|
||||
verify: ["verifier"],
|
||||
complete: ["doc-writer"],
|
||||
};
|
||||
|
||||
constructor(config?: CIConfig) {
|
||||
constructor(config?: CIAgentConfig) {
|
||||
super();
|
||||
this.config = config || loadConfig(process.cwd());
|
||||
this.currentMilestone = "v1.0";
|
||||
@@ -57,14 +63,15 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const startTime = Date.now();
|
||||
this.log("Starting CI Orchestrator pipeline (git-native)");
|
||||
this.log("Starting CIAgent Orchestrator pipeline (git-native)");
|
||||
|
||||
try {
|
||||
this.config = loadConfig(context.project_path);
|
||||
|
||||
const projectSlug = context.project_slug || "";
|
||||
this.gitContext = new GitContext(context.project_path);
|
||||
this.gitBranch = new GitBranch(context.project_path);
|
||||
this.ciFiles = new CiFiles(context.project_path);
|
||||
this.ciFiles = new CIAgentFiles(context.project_path, projectSlug || undefined);
|
||||
this.ciFiles.ensureCIDir();
|
||||
|
||||
const projectState = this.gitContext.reconstructState();
|
||||
@@ -78,47 +85,67 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
this.pipelineState.current_stage = projectState.currentStage;
|
||||
}
|
||||
|
||||
this.totalPhases = this.deriveTotalPhases();
|
||||
this.log(`Total phases in milestone: ${this.totalPhases}`);
|
||||
|
||||
this.decisionEngine = new DecisionEngine(this.config, context.project_path, this.currentMilestone);
|
||||
this.escalationProtocol = new EscalationProtocol(this.config, context.project_path, this.currentMilestone);
|
||||
registerEscalationProtocol(this.escalationProtocol);
|
||||
|
||||
for (const stage of STAGE_ORDER) {
|
||||
this.log(`Entering stage: ${stage}`);
|
||||
this.pipelineState.current_stage = stage;
|
||||
this.pipelineState.last_updated = new Date().toISOString();
|
||||
while (this.pipelineState.current_phase <= this.totalPhases) {
|
||||
this.log(`Processing phase ${this.pipelineState.current_phase} of ${this.totalPhases}`);
|
||||
|
||||
const result = await this.executeStage(stage, context);
|
||||
for (const stage of STAGE_ORDER) {
|
||||
this.log(`Entering stage: ${stage}`);
|
||||
this.pipelineState.current_stage = stage;
|
||||
this.pipelineState.last_updated = new Date().toISOString();
|
||||
|
||||
if (!result.success && stage !== "complete") {
|
||||
this.pipelineState.errors.push({
|
||||
stage,
|
||||
phase: this.pipelineState.current_phase,
|
||||
message: result.error || "Stage failed",
|
||||
timestamp: new Date().toISOString(),
|
||||
retry_count: 0,
|
||||
resolved: false,
|
||||
});
|
||||
const result = await this.executeStageWithRecovery(stage, context);
|
||||
|
||||
if (stage === "specify" || stage === "clarify") {
|
||||
return {
|
||||
success: false,
|
||||
output: `Pipeline failed at ${stage}: ${result.error}`,
|
||||
artifacts_created: this.phaseResults.reduce(
|
||||
(acc, r) => acc + r.artifacts_created.length,
|
||||
0
|
||||
),
|
||||
decisions: this.phaseResults.reduce(
|
||||
(acc, r) => acc + r.decisions_made,
|
||||
0
|
||||
),
|
||||
escalations: this.phaseResults.reduce(
|
||||
(acc, r) => acc + r.escalations_raised,
|
||||
0
|
||||
),
|
||||
duration_ms: Date.now() - startTime,
|
||||
error: result.error,
|
||||
};
|
||||
this.phaseResults.push(result);
|
||||
this.recordPhaseResult(result);
|
||||
|
||||
if (!result.success && stage !== "complete") {
|
||||
this.pipelineState.errors.push({
|
||||
stage,
|
||||
phase: this.pipelineState.current_phase,
|
||||
message: result.error || "Stage failed",
|
||||
timestamp: new Date().toISOString(),
|
||||
retry_count: 0,
|
||||
resolved: false,
|
||||
});
|
||||
|
||||
if (stage === "specify" || stage === "clarify") {
|
||||
return {
|
||||
success: false,
|
||||
output: `Pipeline failed at ${stage}: ${result.error}`,
|
||||
artifacts_created: this.phaseResults.reduce(
|
||||
(acc, r) => acc + r.artifacts_created.length,
|
||||
0
|
||||
),
|
||||
decisions: this.phaseResults.reduce(
|
||||
(acc, r) => acc + r.decisions_made,
|
||||
0
|
||||
),
|
||||
escalations: this.phaseResults.reduce(
|
||||
(acc, r) => acc + r.escalations_raised,
|
||||
0
|
||||
),
|
||||
duration_ms: Date.now() - startTime,
|
||||
error: result.error,
|
||||
};
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
if (this.pipelineState.current_phase < this.totalPhases) {
|
||||
this.performPhaseBoundaryCheckpoint(context);
|
||||
this.pipelineState.current_phase++;
|
||||
this.pipelineState.current_stage = "specify";
|
||||
this.log(`Advancing to phase ${this.pipelineState.current_phase}`);
|
||||
} else {
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
const totalDuration = Date.now() - startTime;
|
||||
@@ -151,36 +178,270 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
duration_ms: Date.now() - startTime,
|
||||
error: err instanceof Error ? err.message : String(err),
|
||||
};
|
||||
} finally {
|
||||
this.escalationProtocol?.dispose();
|
||||
}
|
||||
}
|
||||
|
||||
private buildGitAgentContext(context: AgentContext): GitAgentContext {
|
||||
return {
|
||||
...context,
|
||||
gitContext: this.gitContext!,
|
||||
gitBranch: this.gitBranch!,
|
||||
ciFiles: this.ciFiles!,
|
||||
milestone: this.currentMilestone,
|
||||
};
|
||||
}
|
||||
|
||||
private recordPhaseResult(result: PhaseResult): void {
|
||||
for (const artifact of result.artifacts_created) {
|
||||
this.log(`Artifact created: ${artifact}`);
|
||||
}
|
||||
|
||||
if (result.decisions_made > 0 && this.decisionEngine) {
|
||||
this.decisionEngine.makeHighConfidenceDecision(
|
||||
`Agent reported ${result.decisions_made} decision(s) during ${result.stage}`,
|
||||
`Decisions recorded from ${result.stage} stage execution`,
|
||||
"general",
|
||||
[]
|
||||
);
|
||||
}
|
||||
|
||||
if (result.escalations_raised > 0 && this.escalationProtocol) {
|
||||
this.escalationProtocol.escalate({
|
||||
type: "low_confidence_decision",
|
||||
phase: String(this.pipelineState!.current_phase),
|
||||
description: `Agent reported ${result.escalations_raised} escalation(s) during ${result.stage}`,
|
||||
context: `Stage ${result.stage} raised escalations during execution`,
|
||||
options: [
|
||||
{ id: "proceed", label: "Proceed", description: "Continue pipeline execution", recommended: true },
|
||||
{ id: "halt", label: "Halt", description: "Stop pipeline and await manual review", recommended: false },
|
||||
],
|
||||
default_option_id: "proceed",
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
private deriveTotalPhases(): number {
|
||||
if (!this.ciFiles) return 1;
|
||||
const roadmap = this.ciFiles.readRoadmapMd();
|
||||
if (!roadmap || roadmap.phases.length === 0) return 1;
|
||||
return roadmap.phases.length;
|
||||
}
|
||||
|
||||
private performPhaseBoundaryCheckpoint(context: AgentContext): void {
|
||||
this.log(`Phase boundary checkpoint for phase ${this.pipelineState!.current_phase}`);
|
||||
|
||||
if (this.config.git.auto_commit && this.gitContext!.isGitRepo()) {
|
||||
try {
|
||||
const message = `chore(P${String(this.pipelineState!.current_phase).padStart(2, "0")}): phase boundary checkpoint\n\n---ci---\nphase: ${this.pipelineState!.current_phase}\nmilestone: ${this.currentMilestone}\nstatus: complete\n---/ci---`;
|
||||
execSync(`git add -A && git commit -m "${message.replace(/"/g, '\\"')}" --allow-empty`, {
|
||||
cwd: context.project_path,
|
||||
stdio: "pipe",
|
||||
});
|
||||
} catch (err) {
|
||||
this.warn(`Phase boundary commit failed: ${err instanceof Error ? err.message : String(err)}`);
|
||||
}
|
||||
}
|
||||
|
||||
if (this.ciFiles) {
|
||||
this.ciFiles.updatePhaseStatus(this.pipelineState!.current_phase, "complete");
|
||||
|
||||
const reqs = this.ciFiles.readRequirementsMd();
|
||||
if (reqs) {
|
||||
for (const t of reqs.traceability) {
|
||||
if (t.phase === this.pipelineState!.current_phase && t.status === "in_progress") {
|
||||
this.ciFiles.updateRequirementStatus(t.requirement, "complete");
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
if (this.gitContext) {
|
||||
const verifiedState = this.gitContext.reconstructState();
|
||||
this.log(`Verified state: phase=${verifiedState.currentPhase}, milestone=${verifiedState.currentMilestone}, stage=${verifiedState.currentStage}`);
|
||||
}
|
||||
}
|
||||
|
||||
private async executeStageWithRecovery(
|
||||
stage: PipelineStage,
|
||||
context: AgentContext
|
||||
): Promise<PhaseResult> {
|
||||
try {
|
||||
const result = await this.executeStage(stage, context);
|
||||
if (result.success) return result;
|
||||
} catch (err) {
|
||||
this.warn(`First attempt failed for ${stage}: ${err instanceof Error ? err.message : String(err)}`);
|
||||
}
|
||||
|
||||
this.log(`Retrying stage ${stage}...`);
|
||||
try {
|
||||
const result = await this.executeStage(stage, context);
|
||||
if (result.success) return result;
|
||||
} catch (err) {
|
||||
this.warn(`Retry failed for ${stage}: ${err instanceof Error ? err.message : String(err)}`);
|
||||
}
|
||||
|
||||
if (context.backend) {
|
||||
this.log(`Attempting plan revision for failed stage ${stage}...`);
|
||||
try {
|
||||
const planner = getAgent("planner");
|
||||
const gitContext = this.buildGitAgentContext(context);
|
||||
const planResult = await planner.execute({
|
||||
...gitContext,
|
||||
specification: `Plan revision needed: stage ${stage} failed twice. Original error context: phase ${this.pipelineState!.current_phase}`,
|
||||
});
|
||||
if (planResult.success) {
|
||||
this.log(`Plan revision succeeded, retrying ${stage} with revised plan...`);
|
||||
try {
|
||||
const result = await this.executeStage(stage, context);
|
||||
if (result.success) return result;
|
||||
} catch (err) {
|
||||
this.warn(`Post-revision retry failed for ${stage}: ${err instanceof Error ? err.message : String(err)}`);
|
||||
}
|
||||
}
|
||||
} catch (err) {
|
||||
this.warn(`Plan revision failed: ${err instanceof Error ? err.message : String(err)}`);
|
||||
}
|
||||
}
|
||||
|
||||
if (this.escalationProtocol) {
|
||||
this.escalationProtocol.escalate({
|
||||
type: "verification_failure",
|
||||
phase: String(this.pipelineState!.current_phase),
|
||||
description: `Stage ${stage} failed after retry and plan revision attempts`,
|
||||
context: `All recovery attempts exhausted for stage ${stage} in phase ${this.pipelineState!.current_phase}`,
|
||||
options: [
|
||||
{ id: "skip", label: "Skip stage", description: "Continue pipeline skipping this stage", recommended: true },
|
||||
{ id: "abort", label: "Abort pipeline", description: "Stop the entire pipeline", recommended: false },
|
||||
],
|
||||
default_option_id: "skip",
|
||||
});
|
||||
}
|
||||
|
||||
return {
|
||||
phase: this.pipelineState!.current_phase,
|
||||
stage,
|
||||
success: false,
|
||||
artifacts_created: [],
|
||||
decisions_made: 0,
|
||||
escalations_raised: 1,
|
||||
duration_ms: 0,
|
||||
error: `Stage ${stage} failed after recovery attempts`,
|
||||
};
|
||||
}
|
||||
|
||||
private async executeStage(
|
||||
stage: PipelineStage,
|
||||
context: AgentContext
|
||||
): Promise<PhaseResult> {
|
||||
const stageStart = Date.now();
|
||||
const agentName = OrchestratorAgent.STAGE_AGENT_MAP[stage];
|
||||
const agentNames = OrchestratorAgent.STAGE_AGENT_MAP[stage];
|
||||
|
||||
if (agentName && context.backend) {
|
||||
this.log(`Delegating ${stage} to ${agentName} agent via backend...`);
|
||||
if (agentNames && agentNames.length > 0 && context.backend) {
|
||||
this.log(`Delegating ${stage} to ${agentNames.join(", ")} agent(s) via backend...`);
|
||||
try {
|
||||
const agent = getAgent(agentName);
|
||||
const result = await agent.execute(context);
|
||||
let primaryResult: AgentResult | null = null;
|
||||
const allArtifacts: string[] = [];
|
||||
let totalDecisions = 0;
|
||||
let totalEscalations = 0;
|
||||
let lastError: string | undefined;
|
||||
|
||||
const primaryAgent = getAgent(agentNames[0]);
|
||||
const gitContext = this.buildGitAgentContext(context);
|
||||
const primaryAgentResult = await primaryAgent.execute(gitContext);
|
||||
primaryResult = primaryAgentResult;
|
||||
if (Array.isArray(primaryAgentResult.artifacts_created)) {
|
||||
allArtifacts.push(...primaryAgentResult.artifacts_created);
|
||||
}
|
||||
totalDecisions += primaryAgentResult.decisions;
|
||||
totalEscalations += primaryAgentResult.escalations;
|
||||
|
||||
if (!primaryAgentResult.success) {
|
||||
this.warn(`Primary agent ${agentNames[0]} failed for ${stage}`);
|
||||
return {
|
||||
phase: this.pipelineState!.current_phase,
|
||||
stage,
|
||||
success: false,
|
||||
artifacts_created: allArtifacts,
|
||||
decisions_made: totalDecisions,
|
||||
escalations_raised: totalEscalations,
|
||||
duration_ms: Date.now() - stageStart,
|
||||
error: primaryAgentResult.error || `Primary agent ${agentNames[0]} failed`,
|
||||
};
|
||||
}
|
||||
|
||||
if (agentNames.length > 1) {
|
||||
if (this.config.parallelization?.enabled) {
|
||||
const reviewFactories = agentNames.slice(1).map((reviewAgentName) => {
|
||||
return () => {
|
||||
const agent = getAgent(reviewAgentName);
|
||||
const reviewContext: AgentContext = {
|
||||
...gitContext,
|
||||
specification: `${context.specification}\n\nPrimary agent (${agentNames[0]}) completed. Review context:\n- Success: ${primaryResult!.success}\n- Output: ${primaryResult!.output}\n- Artifacts: ${Array.isArray(primaryResult!.artifacts_created) ? primaryResult!.artifacts_created.join(", ") : String(primaryResult!.artifacts_created)}`,
|
||||
};
|
||||
return agent.execute(reviewContext);
|
||||
};
|
||||
});
|
||||
|
||||
const settled = await this.limitConcurrency(reviewFactories, this.config.parallelization?.max_concurrent_agents ?? 5);
|
||||
for (let si = 0; si < settled.length; si++) {
|
||||
const result = settled[si];
|
||||
if (result.status === "fulfilled") {
|
||||
const agentResult = result.value;
|
||||
if (Array.isArray(agentResult.artifacts_created)) allArtifacts.push(...agentResult.artifacts_created);
|
||||
totalDecisions += agentResult.decisions;
|
||||
totalEscalations += agentResult.escalations;
|
||||
if (!agentResult.success) {
|
||||
this.warn(`Review agent reported issues: ${agentResult.error || "unspecified"}`);
|
||||
lastError = agentResult.error;
|
||||
}
|
||||
} else {
|
||||
this.warn(`Review agent failed: ${result.reason instanceof Error ? result.reason.message : String(result.reason)}`);
|
||||
}
|
||||
}
|
||||
} else {
|
||||
for (let i = 1; i < agentNames.length; i++) {
|
||||
const reviewAgentName = agentNames[i];
|
||||
try {
|
||||
const reviewAgent = getAgent(reviewAgentName);
|
||||
const reviewContext: AgentContext = {
|
||||
...gitContext,
|
||||
specification: `${context.specification}\n\nPrimary agent (${agentNames[0]}) completed. Review context:\n- Success: ${primaryResult!.success}\n- Output: ${primaryResult!.output}\n- Artifacts: ${Array.isArray(primaryResult!.artifacts_created) ? primaryResult!.artifacts_created.join(", ") : String(primaryResult!.artifacts_created)}`,
|
||||
};
|
||||
const result = await reviewAgent.execute(reviewContext);
|
||||
if (Array.isArray(result.artifacts_created)) {
|
||||
allArtifacts.push(...result.artifacts_created);
|
||||
}
|
||||
totalDecisions += result.decisions;
|
||||
totalEscalations += result.escalations;
|
||||
|
||||
if (!result.success) {
|
||||
this.warn(`Review agent ${reviewAgentName} reported issues for ${stage}: ${result.error || "unspecified"}`);
|
||||
lastError = result.error;
|
||||
}
|
||||
} catch (err) {
|
||||
this.warn(`Review agent ${reviewAgentName} failed for ${stage}: ${err instanceof Error ? err.message : String(err)}`);
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return {
|
||||
phase: this.pipelineState!.current_phase,
|
||||
stage,
|
||||
success: result.success,
|
||||
artifacts_created: Array.isArray(result.artifacts_created) ? result.artifacts_created : [],
|
||||
decisions_made: result.decisions,
|
||||
escalations_raised: result.escalations,
|
||||
success: primaryResult?.success ?? false,
|
||||
artifacts_created: allArtifacts,
|
||||
decisions_made: totalDecisions,
|
||||
escalations_raised: totalEscalations,
|
||||
duration_ms: Date.now() - stageStart,
|
||||
error: result.error,
|
||||
error: lastError,
|
||||
};
|
||||
} catch (err) {
|
||||
if (err instanceof BackendUnavailableError) {
|
||||
this.warn(`Backend unavailable for ${stage}, falling back to mechanical execution`);
|
||||
} else {
|
||||
this.warn(`Agent ${agentName} failed for ${stage}: ${err instanceof Error ? err.message : String(err)}`);
|
||||
this.warn(`Agents failed for ${stage}: ${err instanceof Error ? err.message : String(err)}`);
|
||||
}
|
||||
}
|
||||
}
|
||||
@@ -200,6 +461,7 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
projectName: spec.objective.slice(0, 30),
|
||||
phaseCount: 0,
|
||||
milestone: this.currentMilestone,
|
||||
project: context.project_slug || undefined,
|
||||
specification: spec.raw_content,
|
||||
requirements: spec.requirements,
|
||||
constraints: spec.constraints,
|
||||
@@ -207,11 +469,10 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
});
|
||||
|
||||
this.log("Init commit prepared with specification in ---ci--- block");
|
||||
artifactsCreated.push(".ci/config.json");
|
||||
artifactsCreated.push(".ciagent/config.json");
|
||||
|
||||
if (this.config.git.auto_commit && this.gitContext!.isGitRepo()) {
|
||||
try {
|
||||
const { execSync } = await import("node:child_process");
|
||||
this.ciFiles!.writeProjectMd({
|
||||
name: spec.objective.slice(0, 30),
|
||||
coreValue: spec.objective,
|
||||
@@ -274,7 +535,7 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
|
||||
case "research": {
|
||||
this.log("Researching project domain...");
|
||||
this.decisionEngine!.setPhase(1);
|
||||
this.decisionEngine!.setPhase(this.pipelineState!.current_phase);
|
||||
|
||||
const archMd = this.ciFiles!.readArchitectureMd();
|
||||
if (!archMd) {
|
||||
@@ -293,13 +554,12 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
|
||||
if (this.config.git.auto_commit && this.gitContext!.isGitRepo()) {
|
||||
const researchCommit = CommitBuilder.buildResearchCommit(
|
||||
1,
|
||||
this.pipelineState!.current_phase,
|
||||
this.currentMilestone,
|
||||
"initial domain research",
|
||||
["Research completed. Key findings in .ci/ARCHITECTURE.md and .ci/PROJECT.md updates."]
|
||||
["Research completed. Key findings in .ciagent/ARCHITECTURE.md and .ciagent/PROJECT.md updates."]
|
||||
);
|
||||
try {
|
||||
const { execSync } = await import("node:child_process");
|
||||
execSync(`git add -A && git commit -m "${researchCommit.replace(/"/g, '\\"')}" --allow-empty`, {
|
||||
cwd: context.project_path,
|
||||
stdio: "pipe",
|
||||
@@ -310,7 +570,70 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
}
|
||||
|
||||
this.pipelineState!.research_completed = true;
|
||||
artifactsCreated.push(".ci/ARCHITECTURE.md");
|
||||
artifactsCreated.push(".ciagent/ARCHITECTURE.md");
|
||||
break;
|
||||
}
|
||||
|
||||
case "ideate": {
|
||||
this.log("Running ideation stage...");
|
||||
const { IdeationEngine } = await import("../core/ideation.js");
|
||||
const ideationEngine = new IdeationEngine(context.project_path, context.project_slug || undefined);
|
||||
const ideas = ideationEngine.runMechanical();
|
||||
|
||||
const ideationConfig = this.config.ideation;
|
||||
if (ideationConfig?.categories && ideationConfig.categories.length > 0) {
|
||||
const categoryIdeas = ideationEngine.runMechanical(ideationConfig.categories);
|
||||
const seenTitles = new Set(ideas.map((i) => i.title));
|
||||
for (const idea of categoryIdeas) {
|
||||
if (!seenTitles.has(idea.title)) {
|
||||
ideas.push(idea);
|
||||
seenTitles.add(idea.title);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
ideas.sort((a, b) => b.confidence - a.confidence);
|
||||
|
||||
const maxIdeas = ideationConfig?.max_ideas || 20;
|
||||
const trimmedIdeas = ideas.slice(0, maxIdeas);
|
||||
|
||||
if (this.config.git.auto_commit && this.gitContext!.isGitRepo()) {
|
||||
const { accepted: savedIdeas, results } = ideationEngine.acceptIdeas(trimmedIdeas);
|
||||
const savedCount = results.filter((r) => r.addedToRequirements || r.addedToRoadmap).length;
|
||||
|
||||
const ideationCommit = CommitBuilder.buildTaskCommit({
|
||||
type: "decision",
|
||||
phase: this.pipelineState!.current_phase,
|
||||
milestone: this.currentMilestone,
|
||||
project: context.project_slug || undefined,
|
||||
plan: "ideation",
|
||||
task: "ideation-results",
|
||||
subject: `ideation results — ${trimmedIdeas.length} total, ${savedCount} accepted`,
|
||||
status: "ideate",
|
||||
decisions: savedIdeas.map((idea) => ({
|
||||
id: idea.id,
|
||||
decision: idea.title,
|
||||
rationale: idea.rationale,
|
||||
confidence: idea.confidence,
|
||||
alternatives: idea.actions,
|
||||
})),
|
||||
});
|
||||
|
||||
try {
|
||||
execSync(`git add -A && git commit -m "${ideationCommit.replace(/"/g, '\\"')}" --allow-empty`, {
|
||||
cwd: context.project_path,
|
||||
stdio: "pipe",
|
||||
});
|
||||
} catch (err) {
|
||||
this.warn(`Ideation commit failed: ${err instanceof Error ? err.message : String(err)}`);
|
||||
}
|
||||
|
||||
artifactsCreated.push(".ciagent/REQUIREMENTS.md", ".ciagent/ROADMAP.md");
|
||||
decisionsMade += savedCount;
|
||||
}
|
||||
|
||||
this.pipelineState!.ideate_completed = true;
|
||||
this.log(`Ideation stage complete: ${trimmedIdeas.length} ideas generated`);
|
||||
break;
|
||||
}
|
||||
|
||||
@@ -318,7 +641,7 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
this.log("Planning phase execution...");
|
||||
|
||||
if (this.config.git.branching_strategy === "phase" && this.gitBranch && this.gitContext!.isGitRepo()) {
|
||||
this.gitBranch.createPhaseBranch(1, "initial-phase");
|
||||
this.gitBranch.createPhaseBranch(this.pipelineState!.current_phase, "initial-phase");
|
||||
}
|
||||
|
||||
this.pipelineState!.plan_completed = true;
|
||||
@@ -342,6 +665,38 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
this.pipelineState!.execute_completed = true;
|
||||
break;
|
||||
|
||||
case "test": {
|
||||
this.log("Running tests...");
|
||||
if (!context.backend) {
|
||||
this.log("No backend available — running mechanical test fallback via npm test");
|
||||
try {
|
||||
const testOutput = execSync("npm test", {
|
||||
cwd: context.project_path,
|
||||
encoding: "utf-8",
|
||||
stdio: ["pipe", "pipe", "pipe"],
|
||||
timeout: 120000,
|
||||
});
|
||||
this.log("npm test passed");
|
||||
this.pipelineState!.test_completed = true;
|
||||
artifactsCreated.push("test-results");
|
||||
} catch (err) {
|
||||
const errMsg = err instanceof Error ? err.message : String(err);
|
||||
this.warn(`npm test failed: ${errMsg}`);
|
||||
return {
|
||||
phase: this.pipelineState!.current_phase,
|
||||
stage: "test",
|
||||
success: false,
|
||||
artifacts_created: artifactsCreated,
|
||||
decisions_made: decisionsMade,
|
||||
escalations_raised: escalationsRaised,
|
||||
duration_ms: Date.now() - stageStart,
|
||||
error: `Test stage failed: ${errMsg}`,
|
||||
};
|
||||
}
|
||||
}
|
||||
break;
|
||||
}
|
||||
|
||||
case "verify": {
|
||||
this.log("Running verification...");
|
||||
|
||||
@@ -366,13 +721,12 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
|
||||
if (this.config.git.auto_commit && this.gitContext!.isGitRepo()) {
|
||||
const verifyCommit = CommitBuilder.buildVerifyCommit({
|
||||
phase: 1,
|
||||
phase: this.pipelineState!.current_phase,
|
||||
milestone: this.currentMilestone,
|
||||
subject: "automated verification passed",
|
||||
requirements: { covered: [], partial: [] },
|
||||
});
|
||||
try {
|
||||
const { execSync } = await import("node:child_process");
|
||||
execSync(`git add -A && git commit -m "${verifyCommit.replace(/"/g, '\\"')}" --allow-empty`, {
|
||||
cwd: context.project_path,
|
||||
stdio: "pipe",
|
||||
@@ -390,7 +744,7 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
|
||||
if (this.config.git.auto_commit && this.gitContext!.isGitRepo()) {
|
||||
const completionCommit = CommitBuilder.buildPhaseCompletionCommit({
|
||||
phase: 1,
|
||||
phase: this.pipelineState!.current_phase,
|
||||
milestone: this.currentMilestone,
|
||||
phaseName: "initial-phase",
|
||||
tasksCompleted: 0,
|
||||
@@ -398,7 +752,6 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
taskNames: [],
|
||||
});
|
||||
try {
|
||||
const { execSync } = await import("node:child_process");
|
||||
execSync(`git add -A && git commit -m "${completionCommit.replace(/"/g, '\\"')}" --allow-empty`, {
|
||||
cwd: context.project_path,
|
||||
stdio: "pipe",
|
||||
@@ -408,6 +761,30 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
}
|
||||
}
|
||||
|
||||
const versionTag = `${this.currentMilestone}-P${String(this.pipelineState!.current_phase).padStart(2, "0")}`;
|
||||
try {
|
||||
execSync(`git tag "${versionTag}"`, {
|
||||
cwd: context.project_path,
|
||||
stdio: "pipe",
|
||||
});
|
||||
this.log(`Created version tag: ${versionTag}`);
|
||||
artifactsCreated.push(`tag:${versionTag}`);
|
||||
} catch (err) {
|
||||
this.warn(`Version tag creation failed: ${err instanceof Error ? err.message : String(err)}`);
|
||||
}
|
||||
|
||||
if (this.config.git.auto_push && this.gitContext!.isGitRepo()) {
|
||||
try {
|
||||
execSync(`git push origin ${versionTag}`, {
|
||||
cwd: context.project_path,
|
||||
stdio: "pipe",
|
||||
});
|
||||
this.log(`Pushed version tag: ${versionTag}`);
|
||||
} catch (err) {
|
||||
this.warn(`Version tag push failed: ${err instanceof Error ? err.message : String(err)}`);
|
||||
}
|
||||
}
|
||||
|
||||
break;
|
||||
}
|
||||
}
|
||||
@@ -423,9 +800,41 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
};
|
||||
}
|
||||
|
||||
private async limitConcurrency<T>(
|
||||
factories: Array<() => Promise<T>>,
|
||||
maxConcurrency: number
|
||||
): Promise<PromiseSettledResult<T>[]> {
|
||||
if (factories.length === 0) {
|
||||
return [];
|
||||
}
|
||||
|
||||
if (maxConcurrency <= 0 || maxConcurrency >= factories.length) {
|
||||
return Promise.allSettled(factories.map((f) => f()));
|
||||
}
|
||||
|
||||
const results: Array<PromiseSettledResult<T> | undefined> = new Array(factories.length).fill(undefined);
|
||||
let nextIndex = 0;
|
||||
|
||||
const worker = async () => {
|
||||
while (nextIndex < factories.length) {
|
||||
const index = nextIndex++;
|
||||
try {
|
||||
const value = await factories[index]();
|
||||
results[index] = { status: "fulfilled", value };
|
||||
} catch (reason) {
|
||||
results[index] = { status: "rejected", reason };
|
||||
}
|
||||
}
|
||||
};
|
||||
|
||||
const workers = Array(Math.min(maxConcurrency, factories.length)).fill(null).map(() => worker());
|
||||
await Promise.all(workers);
|
||||
return results as PromiseSettledResult<T>[];
|
||||
}
|
||||
|
||||
private generateCompletionReport(): string {
|
||||
const lines: string[] = [
|
||||
"# CI Completion Report",
|
||||
"# CIAgent Completion Report",
|
||||
"",
|
||||
`✓ Pipeline completed successfully (git-native)`,
|
||||
"",
|
||||
@@ -447,4 +856,99 @@ export class OrchestratorAgent extends BaseAgent {
|
||||
|
||||
return lines.join("\n");
|
||||
}
|
||||
|
||||
async runForProject(projectSlug: string, context: AgentContext): Promise<AgentResult> {
|
||||
this.log(`Running pipeline for project: ${projectSlug}`);
|
||||
|
||||
this.ciFiles = new CIAgentFiles(context.project_path, projectSlug);
|
||||
this.ciFiles.ensureCIDir();
|
||||
this.ciFiles.setProjectSlug(projectSlug);
|
||||
|
||||
const projectContext: AgentContext = {
|
||||
...context,
|
||||
project_path: context.project_path,
|
||||
};
|
||||
|
||||
const result = await this.execute(projectContext);
|
||||
|
||||
return {
|
||||
...result,
|
||||
output: result.output ? `[${projectSlug}] ${result.output}` : result.output,
|
||||
};
|
||||
}
|
||||
|
||||
async runForAllProjects(context: AgentContext): Promise<Record<string, AgentResult>> {
|
||||
const config = loadConfig(context.project_path);
|
||||
const ciFiles = new CIAgentFiles(context.project_path);
|
||||
const projects = ciFiles.listProjects();
|
||||
|
||||
const activeProjects: string[] = config.active_projects?.length > 0
|
||||
? config.active_projects
|
||||
: projects.map((p) => p.slug);
|
||||
|
||||
if (activeProjects.length === 0) {
|
||||
this.log("No active projects found; running for default project");
|
||||
const result = await this.execute(context);
|
||||
return { default: result };
|
||||
}
|
||||
|
||||
this.log(`Running pipeline for ${activeProjects.length} project(s): ${activeProjects.join(", ")}`);
|
||||
|
||||
const results: Record<string, AgentResult> = {};
|
||||
const maxConcurrent = config.parallelization?.max_concurrent_projects ?? 3;
|
||||
const parallel = config.parallelization?.enabled && activeProjects.length > 1;
|
||||
|
||||
if (parallel) {
|
||||
const limitedConcurrency = Math.min(maxConcurrent, activeProjects.length);
|
||||
const batches: string[][] = [];
|
||||
for (let i = 0; i < activeProjects.length; i += limitedConcurrency) {
|
||||
batches.push(activeProjects.slice(i, i + limitedConcurrency));
|
||||
}
|
||||
|
||||
for (const batch of batches) {
|
||||
const batchResults = await Promise.allSettled(
|
||||
batch.map(async (slug): Promise<[string, AgentResult]> => {
|
||||
const orchestrator = new OrchestratorAgent(config);
|
||||
const result = await orchestrator.runForProject(slug, context);
|
||||
return [slug, result];
|
||||
})
|
||||
);
|
||||
|
||||
for (const settled of batchResults) {
|
||||
if (settled.status === "fulfilled") {
|
||||
const [slug, result] = settled.value;
|
||||
results[slug] = result;
|
||||
} else {
|
||||
this.warn(`Project pipeline failed: ${settled.reason instanceof Error ? settled.reason.message : String(settled.reason)}`);
|
||||
}
|
||||
}
|
||||
}
|
||||
} else {
|
||||
for (const slug of activeProjects) {
|
||||
this.log(`Processing project: ${slug}`);
|
||||
const orchestrator = new OrchestratorAgent(config);
|
||||
orchestrator.ciFiles = new CIAgentFiles(context.project_path, slug);
|
||||
orchestrator.ciFiles.ensureCIDir();
|
||||
orchestrator.ciFiles.setProjectSlug(slug);
|
||||
|
||||
try {
|
||||
const result = await orchestrator.runForProject(slug, context);
|
||||
results[slug] = result;
|
||||
} catch (err) {
|
||||
this.warn(`Failed for project ${slug}: ${err instanceof Error ? err.message : String(err)}`);
|
||||
results[slug] = {
|
||||
success: false,
|
||||
output: `Pipeline failed for project ${slug}`,
|
||||
artifacts_created: 0,
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
duration_ms: 0,
|
||||
error: err instanceof Error ? err.message : String(err),
|
||||
};
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return results;
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,217 @@
|
||||
async function limitConcurrency<T>(
|
||||
factories: Array<() => Promise<T>>,
|
||||
maxConcurrency: number
|
||||
): Promise<PromiseSettledResult<T>[]> {
|
||||
if (factories.length === 0) {
|
||||
return [];
|
||||
}
|
||||
|
||||
if (maxConcurrency <= 0 || maxConcurrency >= factories.length) {
|
||||
return Promise.allSettled(factories.map((f) => f()));
|
||||
}
|
||||
|
||||
const results: Array<PromiseSettledResult<T> | undefined> = new Array(factories.length).fill(undefined);
|
||||
let nextIndex = 0;
|
||||
|
||||
const worker = async () => {
|
||||
while (nextIndex < factories.length) {
|
||||
const index = nextIndex++;
|
||||
try {
|
||||
const value = await factories[index]();
|
||||
results[index] = { status: "fulfilled", value };
|
||||
} catch (reason) {
|
||||
results[index] = { status: "rejected", reason };
|
||||
}
|
||||
}
|
||||
};
|
||||
|
||||
const workers = Array(Math.min(maxConcurrency, factories.length)).fill(null).map(() => worker());
|
||||
await Promise.all(workers);
|
||||
return results as PromiseSettledResult<T>[];
|
||||
}
|
||||
|
||||
function delay(ms: number): Promise<void> {
|
||||
return new Promise((resolve) => setTimeout(resolve, ms));
|
||||
}
|
||||
|
||||
describe("Parallel Execution", () => {
|
||||
describe("limitConcurrency", () => {
|
||||
it("returns empty array for zero factories", async () => {
|
||||
const results = await limitConcurrency([], 5);
|
||||
expect(results).toEqual([]);
|
||||
});
|
||||
|
||||
it("returns single-element result for one factory", async () => {
|
||||
const results = await limitConcurrency([() => Promise.resolve(42)], 5);
|
||||
expect(results).toHaveLength(1);
|
||||
expect(results[0].status).toBe("fulfilled");
|
||||
if (results[0].status === "fulfilled") {
|
||||
expect(results[0].value).toBe(42);
|
||||
}
|
||||
});
|
||||
|
||||
it("behaves sequentially when maxConcurrency=1", async () => {
|
||||
const order: number[] = [];
|
||||
|
||||
const factories = [1, 2, 3].map((n) => () =>
|
||||
delay(30).then(() => { order.push(n); return n; })
|
||||
);
|
||||
|
||||
const start = Date.now();
|
||||
const results = await limitConcurrency(factories, 1);
|
||||
const elapsed = Date.now() - start;
|
||||
|
||||
expect(results).toHaveLength(3);
|
||||
for (const r of results) {
|
||||
expect(r.status).toBe("fulfilled");
|
||||
}
|
||||
expect(order).toEqual([1, 2, 3]);
|
||||
expect(elapsed).toBeGreaterThanOrEqual(80);
|
||||
});
|
||||
|
||||
it("runs concurrently when maxConcurrency exceeds factory count", async () => {
|
||||
const factories = ["a", "b"].map((v) => () =>
|
||||
delay(50).then(() => v)
|
||||
);
|
||||
|
||||
const start = Date.now();
|
||||
const results = await limitConcurrency(factories, 10);
|
||||
const elapsed = Date.now() - start;
|
||||
|
||||
expect(results).toHaveLength(2);
|
||||
expect(elapsed).toBeLessThan(120);
|
||||
});
|
||||
|
||||
it("limits to maxConcurrency=2 with 4 factories", async () => {
|
||||
const timestamps: number[] = [];
|
||||
|
||||
const factories = [0, 1, 2, 3].map((i) => () =>
|
||||
delay(80).then(() => { timestamps.push(i); return i; })
|
||||
);
|
||||
|
||||
const start = Date.now();
|
||||
const results = await limitConcurrency(factories, 2);
|
||||
const elapsed = Date.now() - start;
|
||||
|
||||
expect(results).toHaveLength(4);
|
||||
for (const r of results) {
|
||||
expect(r.status).toBe("fulfilled");
|
||||
if (r.status === "fulfilled") {
|
||||
expect([0, 1, 2, 3]).toContain(r.value);
|
||||
}
|
||||
}
|
||||
|
||||
expect(elapsed).toBeGreaterThanOrEqual(150);
|
||||
expect(elapsed).toBeLessThan(350);
|
||||
});
|
||||
|
||||
it("isolates rejected promises from fulfilled ones", async () => {
|
||||
const factories = [
|
||||
() => Promise.resolve("success"),
|
||||
() => Promise.reject(new Error("boom")),
|
||||
() => Promise.resolve("also-success"),
|
||||
];
|
||||
|
||||
const results = await limitConcurrency(factories, 5);
|
||||
|
||||
expect(results).toHaveLength(3);
|
||||
const fulfilled = results.filter((r) => r.status === "fulfilled");
|
||||
const rejected = results.filter((r) => r.status === "rejected");
|
||||
expect(fulfilled).toHaveLength(2);
|
||||
expect(rejected).toHaveLength(1);
|
||||
|
||||
if (fulfilled[0].status === "fulfilled") {
|
||||
expect(fulfilled[0].value).toBe("success");
|
||||
}
|
||||
if (fulfilled[1].status === "fulfilled") {
|
||||
expect(fulfilled[1].value).toBe("also-success");
|
||||
}
|
||||
if (rejected[0].status === "rejected") {
|
||||
expect((rejected[0].reason as Error).message).toBe("boom");
|
||||
}
|
||||
});
|
||||
|
||||
it("handles maxConcurrency=0 as no limit", async () => {
|
||||
const factories = [1, 2, 3].map((v) => () => Promise.resolve(v));
|
||||
const results = await limitConcurrency(factories, 0);
|
||||
expect(results).toHaveLength(3);
|
||||
for (const r of results) {
|
||||
expect(r.status).toBe("fulfilled");
|
||||
}
|
||||
});
|
||||
});
|
||||
|
||||
describe("parallel vs sequential timing", () => {
|
||||
it("parallel execution is faster than sequential", async () => {
|
||||
const DELAY_MS = 50;
|
||||
const parallelFactories = [DELAY_MS, DELAY_MS].map((ms) => () => delay(ms));
|
||||
|
||||
const parallelStart = Date.now();
|
||||
const parallelResults = await limitConcurrency(parallelFactories, 5);
|
||||
const parallelElapsed = Date.now() - parallelStart;
|
||||
|
||||
const sequentialStart = Date.now();
|
||||
for (const ms of [DELAY_MS, DELAY_MS]) {
|
||||
await delay(ms);
|
||||
}
|
||||
const sequentialElapsed = Date.now() - sequentialStart;
|
||||
|
||||
expect(parallelResults).toHaveLength(2);
|
||||
expect(parallelElapsed).toBeLessThan(sequentialElapsed);
|
||||
expect(parallelElapsed).toBeLessThan(DELAY_MS * 1.8);
|
||||
});
|
||||
});
|
||||
|
||||
describe("concurrency limit verification", () => {
|
||||
it("at most maxConcurrency agents run simultaneously", async () => {
|
||||
let concurrentCount = 0;
|
||||
let maxConcurrent = 0;
|
||||
const MAX = 2;
|
||||
|
||||
const factories = [0, 1, 2, 3].map(
|
||||
(i) => () =>
|
||||
new Promise<number>((resolve) => {
|
||||
concurrentCount++;
|
||||
if (concurrentCount > maxConcurrent) maxConcurrent = concurrentCount;
|
||||
delay(60).then(() => {
|
||||
concurrentCount--;
|
||||
resolve(i);
|
||||
});
|
||||
})
|
||||
);
|
||||
|
||||
const results = await limitConcurrency(factories, MAX);
|
||||
|
||||
expect(results).toHaveLength(4);
|
||||
expect(maxConcurrent).toBeLessThanOrEqual(MAX);
|
||||
});
|
||||
});
|
||||
|
||||
describe("sequential fallback behavior", () => {
|
||||
it("runs agents in order when parallelization disabled", async () => {
|
||||
const executionOrder: string[] = [];
|
||||
|
||||
await (async () => {
|
||||
for (const name of ["code-reviewer", "security-auditor"]) {
|
||||
executionOrder.push(`start:${name}`);
|
||||
await delay(10);
|
||||
executionOrder.push(`end:${name}`);
|
||||
}
|
||||
})();
|
||||
|
||||
expect(executionOrder).toEqual([
|
||||
"start:code-reviewer",
|
||||
"end:code-reviewer",
|
||||
"start:security-auditor",
|
||||
"end:security-auditor",
|
||||
]);
|
||||
});
|
||||
});
|
||||
|
||||
describe("single agent edge case", () => {
|
||||
it("no review agents means no parallel code path triggered", async () => {
|
||||
const results = await limitConcurrency([], 5);
|
||||
expect(results).toHaveLength(0);
|
||||
});
|
||||
});
|
||||
});
|
||||
@@ -0,0 +1,74 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { PhaseResearcherAgent } from "../agents/phase-researcher.js";
|
||||
|
||||
describe("PhaseResearcherAgent", () => {
|
||||
let tempDir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
tempDir = fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-phase-researcher-test-"));
|
||||
fs.mkdirSync(path.join(tempDir, ".git"), { recursive: true });
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
fs.rmSync(tempDir, { recursive: true, force: true });
|
||||
});
|
||||
|
||||
it("extracts decisions from commit log content", () => {
|
||||
const agent = new PhaseResearcherAgent();
|
||||
const result = agent.extractDecisions(
|
||||
`some commit\n---ci---\nphase: 1\ndecisions:\n - D-101: Use SQLite for storage confidence: 0.9\n - D-102: Retry on failure confidence: 0.3\n---/ci---\n`
|
||||
);
|
||||
|
||||
expect(result.length).toBe(2);
|
||||
expect(result[0].id).toBe("D-101");
|
||||
expect(result[0].confidence).toBe(0.9);
|
||||
expect(result[1].id).toBe("D-102");
|
||||
expect(result[1].confidence).toBe(0.3);
|
||||
});
|
||||
|
||||
it("extracts lessons from commit log content", () => {
|
||||
const agent = new PhaseResearcherAgent();
|
||||
const result = agent.extractLessons(
|
||||
`some commit\n---ci---\nphase: 1\nlessons:\n - testing: Flaky tests are a problem\n - build: CI timeouts\n---/ci---\n`
|
||||
);
|
||||
|
||||
expect(result.length).toBe(2);
|
||||
expect(result[0]).toContain("testing");
|
||||
});
|
||||
|
||||
it("identifies risks from low-confidence decisions and repeated lessons", () => {
|
||||
const agent = new PhaseResearcherAgent();
|
||||
const decisions = [
|
||||
{ id: "D-1", decision: "Risky choice", confidence: 0.4 },
|
||||
{ id: "D-2", decision: "Safe choice", confidence: 0.9 },
|
||||
];
|
||||
const lessons = [
|
||||
"testing: Flaky tests",
|
||||
"testing: More flaky tests",
|
||||
"build: CI timeouts",
|
||||
];
|
||||
|
||||
const risks = agent.identifyRisks(decisions, lessons);
|
||||
|
||||
const highRisk = risks.filter((r) => r.severity === "high");
|
||||
expect(highRisk.length).toBeGreaterThan(0);
|
||||
expect(highRisk.some((r) => r.description.includes("D-1"))).toBe(true);
|
||||
});
|
||||
|
||||
it("handles empty git log gracefully", () => {
|
||||
const agent = new PhaseResearcherAgent();
|
||||
const result = agent.mechanicalPhaseResearch(tempDir, 1);
|
||||
|
||||
expect(result.phase).toBe(1);
|
||||
expect(result.decisions).toEqual([]);
|
||||
expect(result.lessons).toEqual([]);
|
||||
expect(result.risks).toEqual([]);
|
||||
});
|
||||
|
||||
it("agent name is phase-researcher", () => {
|
||||
const agent = new PhaseResearcherAgent();
|
||||
expect(agent.name).toBe("phase-researcher");
|
||||
});
|
||||
});
|
||||
@@ -1,5 +1,14 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
|
||||
interface PhaseResearchResult {
|
||||
phase: number;
|
||||
decisions: Array<{ id: string; decision: string; confidence: number }>;
|
||||
lessons: string[];
|
||||
risks: Array<{ description: string; severity: string }>;
|
||||
}
|
||||
|
||||
export class PhaseResearcherAgent extends BaseAgent {
|
||||
readonly name = "phase-researcher";
|
||||
readonly description = "Researches how to implement a specific phase well.";
|
||||
@@ -8,6 +17,7 @@ export class PhaseResearcherAgent extends BaseAgent {
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Researching phase implementation...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
@@ -15,14 +25,130 @@ export class PhaseResearcherAgent extends BaseAgent {
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const result = this.mechanicalPhaseResearch(context.project_path, context.phase);
|
||||
const output = this.formatResult(result);
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Phase research requires an intelligence backend.",
|
||||
success: true,
|
||||
output,
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
escalations: result.risks.filter((r) => r.severity === "high").length,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
};
|
||||
}
|
||||
|
||||
mechanicalPhaseResearch(projectPath: string, phase: number): PhaseResearchResult {
|
||||
const logContent = this.readPhaseGitLog(projectPath, phase);
|
||||
const decisions = this.extractDecisions(logContent);
|
||||
const lessons = this.extractLessons(logContent);
|
||||
const risks = this.identifyRisks(decisions, lessons);
|
||||
|
||||
return { phase, decisions, lessons, risks };
|
||||
}
|
||||
|
||||
readPhaseGitLog(projectPath: string, phase: number): string {
|
||||
try {
|
||||
const { execSync } = require("node:child_process");
|
||||
return execSync(
|
||||
`git log --all --format="%B" -100`,
|
||||
{ cwd: projectPath, encoding: "utf-8", timeout: 5000 }
|
||||
);
|
||||
} catch {
|
||||
return "";
|
||||
}
|
||||
}
|
||||
|
||||
extractDecisions(logContent: string): Array<{ id: string; decision: string; confidence: number }> {
|
||||
const decisions: Array<{ id: string; decision: string; confidence: number }> = [];
|
||||
const decisionRegex = /(?:decisions|decision):\s*\n((?:\s+-\s+.+\n?)+)/g;
|
||||
let match;
|
||||
while ((match = decisionRegex.exec(logContent)) !== null) {
|
||||
const items = match[1].split("\n").filter((l: string) => l.trim().startsWith("-"));
|
||||
for (const item of items) {
|
||||
const text = item.replace(/^\s*-\s*/, "").trim();
|
||||
const idMatch = text.match(/D-(\d+)/);
|
||||
const id = idMatch ? `D-${idMatch[1]}` : `D-${decisions.length + 1}`;
|
||||
const confMatch = text.match(/confidence[:\s]+(\d+\.?\d*)/);
|
||||
const confidence = confMatch ? parseFloat(confMatch[1]) : 0.5;
|
||||
decisions.push({ id, decision: text, confidence });
|
||||
}
|
||||
}
|
||||
return decisions;
|
||||
}
|
||||
|
||||
extractLessons(logContent: string): string[] {
|
||||
const lessons: string[] = [];
|
||||
const lessonsRegex = /lessons:\s*\n((?:\s+-\s+.+\n?)+)/g;
|
||||
let match;
|
||||
while ((match = lessonsRegex.exec(logContent)) !== null) {
|
||||
const items = match[1].split("\n").filter((l: string) => l.trim().startsWith("-"));
|
||||
for (const item of items) {
|
||||
lessons.push(item.replace(/^\s*-\s*/, "").trim());
|
||||
}
|
||||
}
|
||||
return lessons;
|
||||
}
|
||||
|
||||
identifyRisks(
|
||||
decisions: Array<{ id: string; decision: string; confidence: number }>,
|
||||
lessons: string[]
|
||||
): Array<{ description: string; severity: string }> {
|
||||
const risks: Array<{ description: string; severity: string }> = [];
|
||||
|
||||
for (const decision of decisions) {
|
||||
if (decision.confidence < 0.5) {
|
||||
risks.push({
|
||||
description: `Low-confidence decision ${decision.id}: ${decision.decision.substring(0, 60)}`,
|
||||
severity: "high",
|
||||
});
|
||||
} else if (decision.confidence < 0.7) {
|
||||
risks.push({
|
||||
description: `Medium-confidence decision ${decision.id}: ${decision.decision.substring(0, 60)}`,
|
||||
severity: "medium",
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
const topicCounts: Record<string, number> = {};
|
||||
for (const lesson of lessons) {
|
||||
const topic = lesson.split(":")[0].trim().toLowerCase();
|
||||
topicCounts[topic] = (topicCounts[topic] || 0) + 1;
|
||||
}
|
||||
|
||||
for (const [topic, count] of Object.entries(topicCounts)) {
|
||||
if (count > 1) {
|
||||
risks.push({
|
||||
description: `Repeated lesson on "${topic}" (${count} occurrences) suggests systemic risk`,
|
||||
severity: count >= 3 ? "high" : "medium",
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
return risks;
|
||||
}
|
||||
|
||||
private formatResult(result: PhaseResearchResult): string {
|
||||
const lines: string[] = [`Phase ${result.phase} Research:`, ""];
|
||||
|
||||
lines.push("Decisions:");
|
||||
for (const d of result.decisions) {
|
||||
lines.push(` [${d.id}|conf=${d.confidence.toFixed(2)}] ${d.decision}`);
|
||||
}
|
||||
|
||||
lines.push("");
|
||||
lines.push("Lessons:");
|
||||
for (const l of result.lessons) {
|
||||
lines.push(` - ${l}`);
|
||||
}
|
||||
|
||||
lines.push("");
|
||||
lines.push("Risks:");
|
||||
for (const r of result.risks) {
|
||||
lines.push(` [${r.severity}] ${r.description}`);
|
||||
}
|
||||
|
||||
return lines.join("\n");
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,107 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { PlanCheckerAgent } from "../agents/plan-checker.js";
|
||||
|
||||
describe("PlanCheckerAgent", () => {
|
||||
let tempDir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
tempDir = fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-plan-checker-test-"));
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
fs.rmSync(tempDir, { recursive: true, force: true });
|
||||
});
|
||||
|
||||
it("detects missing required sections", () => {
|
||||
const agent = new PlanCheckerAgent();
|
||||
const results = agent.mechanicalPlanCheck(tempDir, "no sections here");
|
||||
|
||||
const missing = results.filter((r) => r.type === "missing_section");
|
||||
expect(missing.length).toBeGreaterThan(0);
|
||||
expect(missing.some((r) => r.description.includes("# Phase"))).toBe(true);
|
||||
expect(missing.some((r) => r.description.includes("## Phase Goal"))).toBe(true);
|
||||
expect(missing.some((r) => r.description.includes("## Plans"))).toBe(true);
|
||||
});
|
||||
|
||||
it("detects task ID gaps", () => {
|
||||
const plan = `
|
||||
# Phase 1
|
||||
## Phase Goal
|
||||
Build it
|
||||
## Plans
|
||||
### Task 1.1: T1.1
|
||||
stuff
|
||||
### Task 1.1: T1.3
|
||||
more stuff
|
||||
`;
|
||||
const agent = new PlanCheckerAgent();
|
||||
const results = agent.mechanicalPlanCheck(tempDir, plan);
|
||||
|
||||
const gaps = results.filter((r) => r.type === "task_id_gap");
|
||||
expect(gaps.length).toBeGreaterThan(0);
|
||||
});
|
||||
|
||||
it("detects missing must-haves", () => {
|
||||
const plan = `
|
||||
# Phase 1
|
||||
## Phase Goal
|
||||
Build
|
||||
## Plans
|
||||
### Task 1.1: T1.1
|
||||
Do the thing
|
||||
`;
|
||||
const agent = new PlanCheckerAgent();
|
||||
const results = agent.mechanicalPlanCheck(tempDir, plan);
|
||||
|
||||
const missingMustHaves = results.filter((r) => r.type === "missing_must_haves");
|
||||
expect(missingMustHaves.length).toBeGreaterThan(0);
|
||||
});
|
||||
|
||||
it("detects invalid wave ordering", () => {
|
||||
const plan = `
|
||||
# Phase 1
|
||||
## Phase Goal
|
||||
Goal
|
||||
## Plans
|
||||
## Wave 2
|
||||
tasks
|
||||
## Wave 1
|
||||
more tasks
|
||||
`;
|
||||
const agent = new PlanCheckerAgent();
|
||||
const results = agent.mechanicalPlanCheck(tempDir, plan);
|
||||
|
||||
const waveInvalid = results.filter((r) => r.type === "wave_order_invalid");
|
||||
expect(waveInvalid.length).toBeGreaterThan(0);
|
||||
expect(waveInvalid[0].severity).toBe("P0");
|
||||
});
|
||||
|
||||
it("detects uncovered requirements", () => {
|
||||
const ciagentDir = path.join(tempDir, ".ciagent");
|
||||
fs.mkdirSync(ciagentDir, { recursive: true });
|
||||
fs.writeFileSync(
|
||||
path.join(ciagentDir, "REQUIREMENTS.md"),
|
||||
"REQ-1: First requirement\nREQ-2: Second requirement\nREQ-3: Third requirement"
|
||||
);
|
||||
|
||||
const plan = `
|
||||
# Phase 1
|
||||
## Phase Goal
|
||||
Goal
|
||||
## Plans
|
||||
REQ-1 is covered
|
||||
`;
|
||||
const agent = new PlanCheckerAgent();
|
||||
const results = agent.mechanicalPlanCheck(tempDir, plan);
|
||||
|
||||
const uncovered = results.filter((r) => r.type === "uncovered_requirement");
|
||||
expect(uncovered.length).toBe(2);
|
||||
});
|
||||
|
||||
it("agent name is plan-checker", () => {
|
||||
const agent = new PlanCheckerAgent();
|
||||
expect(agent.name).toBe("plan-checker");
|
||||
});
|
||||
});
|
||||
+153
-4
@@ -1,5 +1,16 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
|
||||
interface PlanCheckResult {
|
||||
type: "missing_section" | "task_id_gap" | "missing_must_haves" | "wave_order_invalid" | "uncovered_requirement";
|
||||
severity: "P0" | "P1" | "P2";
|
||||
description: string;
|
||||
taskId?: string;
|
||||
}
|
||||
|
||||
const REQUIRED_SECTIONS = ["# Phase", "## Phase Goal", "## Plans"];
|
||||
|
||||
export class PlanCheckerAgent extends BaseAgent {
|
||||
readonly name = "plan-checker";
|
||||
readonly description = "Verifies plan quality. On ISSUES FOUND, triggers automatic plan revision (up to 3 iterations).";
|
||||
@@ -8,6 +19,7 @@ export class PlanCheckerAgent extends BaseAgent {
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Checking plan quality...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
@@ -15,14 +27,151 @@ export class PlanCheckerAgent extends BaseAgent {
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const planPath = path.join(context.project_path, ".ciagent", "PLAN.md");
|
||||
let planContent = "";
|
||||
if (fs.existsSync(planPath)) {
|
||||
planContent = fs.readFileSync(planPath, "utf-8");
|
||||
}
|
||||
|
||||
const results = this.mechanicalPlanCheck(context.project_path, planContent);
|
||||
const p0Count = results.filter((r) => r.severity === "P0").length;
|
||||
const output = this.formatResults(results);
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Plan checking requires an intelligence backend.",
|
||||
success: p0Count === 0,
|
||||
output,
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
escalations: p0Count,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
error: p0Count > 0 ? `${p0Count} P0 issue(s) found` : undefined,
|
||||
};
|
||||
}
|
||||
|
||||
mechanicalPlanCheck(projectPath: string, planContent: string): PlanCheckResult[] {
|
||||
const results: PlanCheckResult[] = [];
|
||||
|
||||
this.checkStructure(planContent, results);
|
||||
this.checkTaskIds(planContent, results);
|
||||
this.checkMustHavesPresent(planContent, results);
|
||||
this.checkWaveOrdering(planContent, results);
|
||||
this.checkRequirementCoverage(projectPath, planContent, results);
|
||||
|
||||
return results;
|
||||
}
|
||||
|
||||
checkStructure(planContent: string, results: PlanCheckResult[]): void {
|
||||
for (const section of REQUIRED_SECTIONS) {
|
||||
if (!planContent.includes(section)) {
|
||||
results.push({
|
||||
type: "missing_section",
|
||||
severity: "P0",
|
||||
description: `Plan is missing required section: ${section}`,
|
||||
});
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
checkTaskIds(planContent: string, results: PlanCheckResult[]): void {
|
||||
const taskIdRegex = /###?\s+Task\s+[\d.]+[:\s]+T?([\d.]+)/gi;
|
||||
const ids: number[] = [];
|
||||
let match;
|
||||
while ((match = taskIdRegex.exec(planContent)) !== null) {
|
||||
const idParts = match[1].split(".");
|
||||
const taskId = parseInt(idParts[idParts.length - 1], 10);
|
||||
if (!isNaN(taskId)) ids.push(taskId);
|
||||
}
|
||||
|
||||
if (ids.length === 0) return;
|
||||
|
||||
for (let i = 1; i <= Math.max(...ids); i++) {
|
||||
if (!ids.includes(i)) {
|
||||
results.push({
|
||||
type: "task_id_gap",
|
||||
severity: "P1",
|
||||
description: `Task ID gap: missing Task ${i}`,
|
||||
taskId: `T${i}`,
|
||||
});
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
checkMustHavesPresent(planContent: string, results: PlanCheckResult[]): void {
|
||||
const taskRegex = /###?\s+Task[^]*?(?=###?\s+Task|$)/g;
|
||||
const taskBlocks = planContent.match(taskRegex) || [];
|
||||
|
||||
for (const block of taskBlocks) {
|
||||
const headerMatch = block.match(/###?\s+Task\s+([\d.]+)/);
|
||||
if (!headerMatch) continue;
|
||||
const taskId = headerMatch[1];
|
||||
const hasMustHaves = /must.haves|acceptance.criteria|must.?have/i.test(block);
|
||||
if (!hasMustHaves) {
|
||||
results.push({
|
||||
type: "missing_must_haves",
|
||||
severity: "P1",
|
||||
description: `Task ${taskId} is missing must-haves/acceptance criteria`,
|
||||
taskId,
|
||||
});
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
checkWaveOrdering(planContent: string, results: PlanCheckResult[]): void {
|
||||
const waveRegex = /##?\s+Wave\s+(\d+)/gi;
|
||||
const waves: number[] = [];
|
||||
let match;
|
||||
while ((match = waveRegex.exec(planContent)) !== null) {
|
||||
waves.push(parseInt(match[1], 10));
|
||||
}
|
||||
|
||||
for (let i = 1; i < waves.length; i++) {
|
||||
if (waves[i] < waves[i - 1]) {
|
||||
results.push({
|
||||
type: "wave_order_invalid",
|
||||
severity: "P0",
|
||||
description: `Wave ordering invalid: Wave ${waves[i]} appears after Wave ${waves[i - 1]}`,
|
||||
});
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
checkRequirementCoverage(projectPath: string, planContent: string, results: PlanCheckResult[]): void {
|
||||
const reqPath = path.join(projectPath, ".ciagent", "REQUIREMENTS.md");
|
||||
if (!fs.existsSync(reqPath)) return;
|
||||
|
||||
const reqContent = fs.readFileSync(reqPath, "utf-8");
|
||||
const reqIdRegex = /REQ-(\d+)/g;
|
||||
const requirements = new Set<string>();
|
||||
let reqMatch;
|
||||
while ((reqMatch = reqIdRegex.exec(reqContent)) !== null) {
|
||||
requirements.add(`REQ-${reqMatch[1]}`);
|
||||
}
|
||||
|
||||
const planReqIdRegex = /REQ-(\d+)/g;
|
||||
const coveredReqs = new Set<string>();
|
||||
let planMatch;
|
||||
while ((planMatch = planReqIdRegex.exec(planContent)) !== null) {
|
||||
coveredReqs.add(`REQ-${planMatch[1]}`);
|
||||
}
|
||||
|
||||
for (const req of requirements) {
|
||||
if (!coveredReqs.has(req)) {
|
||||
results.push({
|
||||
type: "uncovered_requirement",
|
||||
severity: "P2",
|
||||
description: `Requirement ${req} not covered in plan`,
|
||||
});
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
private formatResults(results: PlanCheckResult[]): string {
|
||||
if (results.length === 0) return "Plan check passed — no issues found.";
|
||||
const lines: string[] = ["Plan Check Results:", ""];
|
||||
for (const r of results) {
|
||||
lines.push(`[${r.type}|${r.severity}] ${r.description}${r.taskId ? ` (task: ${r.taskId})` : ""}`);
|
||||
}
|
||||
return lines.join("\n");
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,167 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { PlannerAgent } from "../agents/planner.js";
|
||||
import { AgentContext } from "../agents/base.js";
|
||||
import { IntelligenceBackend, BackendRequest, BackendResult } from "../backends/types.js";
|
||||
import { Decision } from "../types/decisions.js";
|
||||
import { Escalation } from "../types/escalation.js";
|
||||
import { emptyTokenUsage } from "../backends/types.js";
|
||||
|
||||
class MockBackend implements IntelligenceBackend {
|
||||
readonly name = "mock";
|
||||
readonly type = "llm" as const;
|
||||
async isAvailable(): Promise<boolean> { return true; }
|
||||
async execute(request: BackendRequest): Promise<BackendResult> {
|
||||
return {
|
||||
success: true,
|
||||
output: `Mock backend executed: ${request.task.slice(0, 50)}`,
|
||||
artifacts: [],
|
||||
decisions: [],
|
||||
escalations: [],
|
||||
usage: emptyTokenUsage(),
|
||||
};
|
||||
}
|
||||
}
|
||||
|
||||
function createTempDir(): string {
|
||||
return fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-planner-test-"));
|
||||
}
|
||||
|
||||
function cleanup(dir: string): void {
|
||||
fs.rmSync(dir, { recursive: true, force: true });
|
||||
}
|
||||
|
||||
function makeContext(dir: string, backend?: IntelligenceBackend): AgentContext {
|
||||
return {
|
||||
project_path: dir,
|
||||
phase: 1,
|
||||
stage: "plan",
|
||||
specification: "Build a REST API for task management",
|
||||
config_path: path.join(dir, ".ciagent", "config.json"),
|
||||
backend,
|
||||
};
|
||||
}
|
||||
|
||||
function setupCIAgentDir(dir: string): void {
|
||||
const ciDir = path.join(dir, ".ciagent");
|
||||
fs.mkdirSync(ciDir, { recursive: true });
|
||||
fs.writeFileSync(path.join(ciDir, "config.json"), "{}");
|
||||
}
|
||||
|
||||
function writeRequirementsMd(dir: string): void {
|
||||
const ciDir = path.join(dir, ".ciagent");
|
||||
const content = [
|
||||
"# Requirements",
|
||||
"",
|
||||
"## v1 Requirements",
|
||||
"",
|
||||
"### Core",
|
||||
"",
|
||||
"- [ ] **REQ-01**: User authentication",
|
||||
"- [ ] **REQ-02**: Task CRUD operations",
|
||||
"- [ ] **REQ-03**: Real-time notifications",
|
||||
"",
|
||||
"## Traceability",
|
||||
"",
|
||||
"| Requirement | Phase | Status |",
|
||||
"|-------------|-------|--------|",
|
||||
"| REQ-01 | Phase 1 | in_progress |",
|
||||
"| REQ-02 | Phase 1 | pending |",
|
||||
"| REQ-03 | Phase 1 | blocked |",
|
||||
].join("\n");
|
||||
fs.writeFileSync(path.join(ciDir, "REQUIREMENTS.md"), content);
|
||||
}
|
||||
|
||||
function writeRoadmapMd(dir: string): void {
|
||||
const ciDir = path.join(dir, ".ciagent");
|
||||
const content = [
|
||||
"# Roadmap",
|
||||
"",
|
||||
"## Overview",
|
||||
"",
|
||||
"Task management API roadmap",
|
||||
"",
|
||||
"## Phases",
|
||||
"",
|
||||
"- [ ] **Phase 1: Authentication** - Implement auth",
|
||||
"",
|
||||
"## Phase Details",
|
||||
"",
|
||||
"### Phase 1: Authentication",
|
||||
"**Goal**: Implement user authentication",
|
||||
"**Depends on**: Nothing",
|
||||
"**Requirements**: REQ-01, REQ-02",
|
||||
"**Success Criteria**:",
|
||||
"1. .ciagent/REQUIREMENTS.md exists",
|
||||
"**Status**: in_progress",
|
||||
].join("\n");
|
||||
fs.writeFileSync(path.join(ciDir, "ROADMAP.md"), content);
|
||||
}
|
||||
|
||||
describe("PlannerAgent", () => {
|
||||
let dir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
dir = createTempDir();
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
cleanup(dir);
|
||||
});
|
||||
|
||||
it("returns honest failure without backend when no requirements or roadmap", async () => {
|
||||
setupCIAgentDir(dir);
|
||||
const planner = new PlannerAgent();
|
||||
const result = await planner.execute(makeContext(dir));
|
||||
expect(result.success).toBe(false);
|
||||
expect(result.error).toContain("No requirements or roadmap");
|
||||
});
|
||||
|
||||
it("creates PLAN.md from REQUIREMENTS.md without backend", async () => {
|
||||
setupCIAgentDir(dir);
|
||||
writeRequirementsMd(dir);
|
||||
writeRoadmapMd(dir);
|
||||
|
||||
const planner = new PlannerAgent();
|
||||
const result = await planner.execute(makeContext(dir));
|
||||
|
||||
expect(result.success).toBe(true);
|
||||
expect(result.output).toContain("plan");
|
||||
expect(fs.existsSync(path.join(dir, ".ciagent", "PLAN.md"))).toBe(true);
|
||||
});
|
||||
|
||||
it("PLAN.md contains phase goal and tasks", async () => {
|
||||
setupCIAgentDir(dir);
|
||||
writeRequirementsMd(dir);
|
||||
writeRoadmapMd(dir);
|
||||
|
||||
const planner = new PlannerAgent();
|
||||
await planner.execute(makeContext(dir));
|
||||
|
||||
const planContent = fs.readFileSync(path.join(dir, ".ciagent", "PLAN.md"), "utf-8");
|
||||
expect(planContent).toContain("Phase 1 Plan");
|
||||
expect(planContent).toContain("Phase Goal");
|
||||
expect(planContent).toContain("Tasks");
|
||||
});
|
||||
|
||||
it("delegates to backend when available", async () => {
|
||||
setupCIAgentDir(dir);
|
||||
const mockBackend = new MockBackend();
|
||||
const planner = new PlannerAgent();
|
||||
const result = await planner.execute(makeContext(dir, mockBackend));
|
||||
|
||||
expect(result.success).toBe(true);
|
||||
expect(result.output).toContain("Mock backend executed");
|
||||
});
|
||||
|
||||
it("has correct agent name", () => {
|
||||
const planner = new PlannerAgent();
|
||||
expect(planner.name).toBe("planner");
|
||||
});
|
||||
|
||||
it("has correct workflow", () => {
|
||||
const planner = new PlannerAgent();
|
||||
expect(planner.workflow).toBe("plan");
|
||||
});
|
||||
});
|
||||
+323
-9
@@ -1,4 +1,27 @@
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
import { CIAgentFiles, RequirementsMd, RoadmapMd, ArchitectureMd } from "../core/ciagent-files.js";
|
||||
import { GitContext } from "../core/git-context.js";
|
||||
import { CommitBuilder } from "../core/commit-builder.js";
|
||||
import { writeFile, readFile, ensureDir } from "../utils/file.js";
|
||||
import { execSync } from "node:child_process";
|
||||
import * as path from "node:path";
|
||||
|
||||
export interface PlannerResult {
|
||||
success: boolean;
|
||||
planCount: number;
|
||||
waves: { wave: number; plans: string[] }[];
|
||||
decisions: number;
|
||||
error?: string;
|
||||
}
|
||||
|
||||
interface PlanEntry {
|
||||
name: string;
|
||||
wave: number;
|
||||
requirements: string[];
|
||||
dependsOn: string[];
|
||||
tasks: string[];
|
||||
mustHaves: string[];
|
||||
}
|
||||
|
||||
export class PlannerAgent extends BaseAgent {
|
||||
readonly name = "planner";
|
||||
@@ -8,21 +31,312 @@ export class PlannerAgent extends BaseAgent {
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Creating phase plan...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
`Create a phase plan for stage ${context.stage}, phase ${context.phase}. Specification: ${context.specification}`
|
||||
);
|
||||
const taskPrompt = await this.buildBackendTaskPrompt(context);
|
||||
const result = await this.executeViaBackend(context, taskPrompt);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
return this.executeMechanical(context, start);
|
||||
}
|
||||
|
||||
private async buildBackendTaskPrompt(context: AgentContext): Promise<string> {
|
||||
const ciFiles = new CIAgentFiles(context.project_path);
|
||||
const parts: string[] = [
|
||||
`Create a phase plan for stage ${context.stage}, phase ${context.phase}.`,
|
||||
"",
|
||||
"## Project Context",
|
||||
];
|
||||
|
||||
const roadmap = ciFiles.readRoadmapMd();
|
||||
if (roadmap) {
|
||||
const currentPhase = roadmap.phases.find((p) => p.number === context.phase);
|
||||
if (currentPhase) {
|
||||
parts.push("", "### Phase Goal", currentPhase.description);
|
||||
parts.push("", "### Phase Requirements", currentPhase.requirements.join(", ") || "None specified");
|
||||
parts.push("", "### Phase Dependencies", currentPhase.dependsOn.length > 0 ? currentPhase.dependsOn.map((d) => `Phase ${d}`).join(", ") : "None");
|
||||
parts.push("", "### Success Criteria", ...currentPhase.successCriteria.map((sc) => `- ${sc}`));
|
||||
}
|
||||
}
|
||||
|
||||
const requirements = ciFiles.readRequirementsMd();
|
||||
if (requirements) {
|
||||
const phaseReqs = requirements.traceability.filter((t) => t.phase === context.phase);
|
||||
if (phaseReqs.length > 0) {
|
||||
parts.push("", "### Requirements for Phase", ...phaseReqs.map((t) => `- ${t.requirement} (${t.status})`));
|
||||
}
|
||||
}
|
||||
|
||||
const architecture = ciFiles.readArchitectureMd();
|
||||
if (architecture) {
|
||||
parts.push("", "### Architecture Boundaries", ...architecture.components.map((c) => `- ${c.name}: ${c.boundaries}`));
|
||||
parts.push("", "### Build Order", ...architecture.buildOrder.map((bo) => `${bo}`));
|
||||
}
|
||||
|
||||
parts.push("", "## Specification", context.specification || "No specification provided");
|
||||
|
||||
return parts.join("\n");
|
||||
}
|
||||
|
||||
private executeMechanical(context: AgentContext, start: number): AgentResult {
|
||||
const ciFiles = new CIAgentFiles(context.project_path);
|
||||
ciFiles.ensureCIDir();
|
||||
|
||||
const requirements = ciFiles.readRequirementsMd();
|
||||
const roadmap = ciFiles.readRoadmapMd();
|
||||
const architecture = ciFiles.readArchitectureMd();
|
||||
|
||||
if (!requirements && !roadmap) {
|
||||
return {
|
||||
success: false,
|
||||
output: "Planning requires either .ciagent/REQUIREMENTS.md or .ciagent/ROADMAP.md. Initialize the project first.",
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No requirements or roadmap found for mechanical planning",
|
||||
};
|
||||
}
|
||||
|
||||
let gitLogSummary = "";
|
||||
try {
|
||||
gitLogSummary = execSync("git log --max-count=20 --oneline", {
|
||||
cwd: context.project_path,
|
||||
encoding: "utf-8",
|
||||
stdio: ["pipe", "pipe", "pipe"],
|
||||
}).trim();
|
||||
} catch {
|
||||
gitLogSummary = "(no git history available)";
|
||||
}
|
||||
|
||||
const phaseGoal = this.extractPhaseGoal(roadmap, context.phase);
|
||||
const phaseRequirements = this.extractPhaseRequirements(requirements, context.phase);
|
||||
const componentBoundaries = architecture ? architecture.components.map((c) => c.name) : [];
|
||||
|
||||
const plans = this.buildPlans(phaseRequirements, componentBoundaries, context.phase);
|
||||
|
||||
const planFileContent = this.formatPlanFile(context.phase, phaseGoal, plans);
|
||||
|
||||
const planFilePath = path.join(context.project_path, ".ciagent", "PLAN.md");
|
||||
ensureDir(path.dirname(planFilePath));
|
||||
writeFile(planFilePath, planFileContent);
|
||||
|
||||
const decisionCount = plans.length > 0 ? 1 : 0;
|
||||
|
||||
if (this.shouldCommit(context)) {
|
||||
try {
|
||||
const commitMessage = CommitBuilder.buildTaskCommit({
|
||||
type: "docs",
|
||||
phase: context.phase,
|
||||
milestone: "v1.0",
|
||||
plan: "01",
|
||||
task: "01-01",
|
||||
subject: `create ${plans.length} phase plans`,
|
||||
status: "plan",
|
||||
decisions: decisionCount > 0 ? [{
|
||||
id: "D-001",
|
||||
decision: `Decomposed phase ${context.phase} into ${plans.length} vertical-slice plans`,
|
||||
rationale: "Requirements grouped by dependency analysis — independent requirements in wave 1, dependent in wave 2+",
|
||||
confidence: 0.75,
|
||||
alternatives: ["single monolithic plan", "per-requirement plans"],
|
||||
}] : undefined,
|
||||
});
|
||||
execSync(`git add -A && git commit -m "${commitMessage.replace(/"/g, '\\"')}" --allow-empty`, {
|
||||
cwd: context.project_path,
|
||||
stdio: "pipe",
|
||||
});
|
||||
} catch {
|
||||
this.warn("Plan commit failed");
|
||||
}
|
||||
}
|
||||
|
||||
const waves = this.groupPlansByWave(plans);
|
||||
const plannerResult: PlannerResult = {
|
||||
success: true,
|
||||
planCount: plans.length,
|
||||
waves,
|
||||
decisions: decisionCount,
|
||||
};
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Planning requires an intelligence backend. Configure one with: ci init --backend",
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
success: true,
|
||||
output: `Created ${plans.length} plan(s) across ${waves.length} wave(s) for phase ${context.phase}`,
|
||||
artifacts_created: [".ciagent/PLAN.md"],
|
||||
decisions: decisionCount,
|
||||
escalations: 0,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
};
|
||||
}
|
||||
|
||||
private extractPhaseGoal(roadmap: RoadmapMd | null, phase: number): string {
|
||||
if (!roadmap) return "No roadmap available";
|
||||
const phaseEntry = roadmap.phases.find((p) => p.number === phase);
|
||||
if (phaseEntry) return `${phaseEntry.name}: ${phaseEntry.description}`;
|
||||
return `Phase ${phase} (no roadmap entry)`;
|
||||
}
|
||||
|
||||
private extractPhaseRequirements(requirements: RequirementsMd | null, phase: number): Array<{ id: string; description: string; phase: number; status: string }> {
|
||||
if (!requirements) return [];
|
||||
return requirements.traceability
|
||||
.filter((t) => t.phase === phase)
|
||||
.map((t) => {
|
||||
let description = t.requirement;
|
||||
for (const cat of [...requirements.v1, ...requirements.v2]) {
|
||||
const item = cat.items.find((i) => i.id === t.requirement);
|
||||
if (item) {
|
||||
description = `${t.requirement}: ${item.description}`;
|
||||
break;
|
||||
}
|
||||
}
|
||||
return { id: t.requirement, description, phase: t.phase, status: t.status };
|
||||
});
|
||||
}
|
||||
|
||||
private buildPlans(
|
||||
phaseRequirements: Array<{ id: string; description: string; phase: number; status: string }>,
|
||||
componentBoundaries: string[],
|
||||
phase: number
|
||||
): PlanEntry[] {
|
||||
if (phaseRequirements.length === 0) {
|
||||
return [{
|
||||
name: `Phase ${phase} Core Implementation`,
|
||||
wave: 1,
|
||||
requirements: [],
|
||||
dependsOn: [],
|
||||
tasks: [`Implement phase ${phase} deliverables as specified in ROADMAP.md`],
|
||||
mustHaves: [`Phase ${phase} deliverables exist and pass verification`],
|
||||
}];
|
||||
}
|
||||
|
||||
const independentReqs = phaseRequirements.filter((r) => r.status !== "blocked");
|
||||
const blockedReqs = phaseRequirements.filter((r) => r.status === "blocked");
|
||||
|
||||
const plans: PlanEntry[] = [];
|
||||
|
||||
if (independentReqs.length > 0) {
|
||||
const taskChunks = this.chunkByComponent(independentReqs, componentBoundaries);
|
||||
for (const chunk of taskChunks) {
|
||||
plans.push({
|
||||
name: this.inferPlanName(chunk, phase),
|
||||
wave: 1,
|
||||
requirements: chunk.map((r) => r.id),
|
||||
dependsOn: [],
|
||||
tasks: chunk.map((r) => {
|
||||
const desc = r.description.split(": ").slice(1).join(": ") || r.description;
|
||||
return desc !== r.id ? `Implement ${r.id}: ${desc}` : `Implement ${r.id}`;
|
||||
}),
|
||||
mustHaves: chunk.map((r) => `${r.id} implemented and testable`),
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
if (blockedReqs.length > 0) {
|
||||
const taskChunks = this.chunkByComponent(blockedReqs, componentBoundaries);
|
||||
for (const chunk of taskChunks) {
|
||||
plans.push({
|
||||
name: this.inferPlanName(chunk, phase),
|
||||
wave: plans.length > 0 ? Math.max(...plans.map((p) => p.wave)) + 1 : 2,
|
||||
requirements: chunk.map((r) => r.id),
|
||||
dependsOn: plans.slice(0, plans.length > 0 ? 1 : 0).map((p) => p.name),
|
||||
tasks: chunk.map((r) => {
|
||||
const desc = r.description.split(": ").slice(1).join(": ") || r.description;
|
||||
return desc !== r.id ? `Implement ${r.id}: ${desc}` : `Implement ${r.id}`;
|
||||
}),
|
||||
mustHaves: chunk.map((r) => `${r.id} implemented and testable`),
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
if (plans.length === 0) {
|
||||
plans.push({
|
||||
name: `Phase ${phase} Default`,
|
||||
wave: 1,
|
||||
requirements: [],
|
||||
dependsOn: [],
|
||||
tasks: [`Implement phase ${phase} deliverables`],
|
||||
mustHaves: [`Phase ${phase} deliverables pass verification`],
|
||||
});
|
||||
}
|
||||
|
||||
return plans;
|
||||
}
|
||||
|
||||
private chunkByComponent(
|
||||
reqs: Array<{ id: string; description: string; phase: number; status: string }>,
|
||||
_componentBoundaries: string[]
|
||||
): Array<Array<{ id: string; description: string; phase: number; status: string }>> {
|
||||
if (reqs.length <= 3) return [reqs];
|
||||
const chunks: Array<Array<{ id: string; description: string; phase: number; status: string }>> = [];
|
||||
const chunkSize = Math.ceil(reqs.length / Math.ceil(reqs.length / 3));
|
||||
for (let i = 0; i < reqs.length; i += chunkSize) {
|
||||
chunks.push(reqs.slice(i, i + chunkSize));
|
||||
}
|
||||
return chunks;
|
||||
}
|
||||
|
||||
private inferPlanName(chunk: Array<{ id: string; description: string; phase: number; status: string }>, phase: number): string {
|
||||
if (chunk.length === 1) return `Phase ${phase}: ${chunk[0].id}`;
|
||||
return `Phase ${phase}: ${chunk[0].id}–${chunk[chunk.length - 1].id}`;
|
||||
}
|
||||
|
||||
private groupPlansByWave(plans: PlanEntry[]): { wave: number; plans: string[] }[] {
|
||||
const waveMap = new Map<number, string[]>();
|
||||
for (const plan of plans) {
|
||||
const existing = waveMap.get(plan.wave) || [];
|
||||
existing.push(plan.name);
|
||||
waveMap.set(plan.wave, existing);
|
||||
}
|
||||
return Array.from(waveMap.entries())
|
||||
.sort((a, b) => a[0] - b[0])
|
||||
.map(([wave, names]) => ({ wave, plans: names }));
|
||||
}
|
||||
|
||||
private formatPlanFile(phase: number, phaseGoal: string, plans: PlanEntry[]): string {
|
||||
const lines: string[] = [
|
||||
`# Phase ${phase} Plan`,
|
||||
"",
|
||||
"## Phase Goal",
|
||||
phaseGoal,
|
||||
"",
|
||||
"## Plans",
|
||||
"",
|
||||
];
|
||||
|
||||
for (let i = 0; i < plans.length; i++) {
|
||||
const plan = plans[i];
|
||||
const planNum = i + 1;
|
||||
lines.push(`### Plan ${planNum}: ${plan.name}`);
|
||||
lines.push(`- Wave: ${plan.wave}`);
|
||||
if (plan.requirements.length > 0) {
|
||||
lines.push(`- Requirements: [${plan.requirements.join(", ")}]`);
|
||||
}
|
||||
if (plan.dependsOn.length > 0) {
|
||||
lines.push(`- Depends on: ${plan.dependsOn.join(", ")}`);
|
||||
}
|
||||
lines.push("- Tasks:");
|
||||
for (const task of plan.tasks) {
|
||||
lines.push(` 1. ${task}`);
|
||||
}
|
||||
lines.push("- Must-haves:");
|
||||
for (const mh of plan.mustHaves) {
|
||||
lines.push(` - [x] ${mh}`);
|
||||
}
|
||||
lines.push("");
|
||||
}
|
||||
|
||||
return lines.join("\n");
|
||||
}
|
||||
|
||||
private shouldCommit(context: AgentContext): boolean {
|
||||
try {
|
||||
execSync("git rev-parse --is-inside-work-tree", {
|
||||
cwd: context.project_path,
|
||||
stdio: "pipe",
|
||||
});
|
||||
return true;
|
||||
} catch {
|
||||
return false;
|
||||
}
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,93 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { ProjectResearcherAgent } from "../agents/project-researcher.js";
|
||||
|
||||
describe("ProjectResearcherAgent", () => {
|
||||
let tempDir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
tempDir = fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-project-researcher-test-"));
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
fs.rmSync(tempDir, { recursive: true, force: true });
|
||||
});
|
||||
|
||||
it("reads package.json and categorizes dependencies", () => {
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, "package.json"),
|
||||
JSON.stringify({
|
||||
dependencies: { express: "^4.18.0", graphql: "^16.0.0" },
|
||||
devDependencies: { jest: "^29.0.0", typescript: "^5.0.0" },
|
||||
})
|
||||
);
|
||||
|
||||
const agent = new ProjectResearcherAgent();
|
||||
const pkg = agent.readPackageJson(tempDir);
|
||||
const tsconfig = {};
|
||||
const summary = agent.categorizeFindings(pkg, tsconfig, []);
|
||||
|
||||
expect(summary.frameworks).toContain("express");
|
||||
expect(summary.frameworks).toContain("jest");
|
||||
expect(summary.apis).toContain("graphql");
|
||||
expect(summary.tooling).toContain("typescript");
|
||||
});
|
||||
|
||||
it("reads tsconfig and extracts compiler options", () => {
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, "tsconfig.json"),
|
||||
JSON.stringify({
|
||||
compilerOptions: { target: "ES2022", module: "Node16" },
|
||||
})
|
||||
);
|
||||
|
||||
const agent = new ProjectResearcherAgent();
|
||||
const tsconfig = agent.readTsconfig(tempDir);
|
||||
|
||||
expect((tsconfig.compilerOptions as Record<string, unknown>).target).toBe("ES2022");
|
||||
expect((tsconfig.compilerOptions as Record<string, unknown>).module).toBe("Node16");
|
||||
});
|
||||
|
||||
it("categorizes tooling from scripts and engines", () => {
|
||||
const pkg = {
|
||||
scripts: { build: "tsc", test: "jest", lint: "eslint ." },
|
||||
engines: { node: ">=18.0.0" },
|
||||
};
|
||||
|
||||
const agent = new ProjectResearcherAgent();
|
||||
const summary = agent.categorizeFindings(pkg, {}, []);
|
||||
|
||||
expect(summary.tooling).toContain("build_script");
|
||||
expect(summary.tooling).toContain("test_script");
|
||||
expect(summary.tooling).toContain("lint_script");
|
||||
expect(summary.tooling).toContain("node:>=18.0.0");
|
||||
});
|
||||
|
||||
it("detects patterns from devDependencies", () => {
|
||||
const pkg = {
|
||||
devDependencies: { jest: "^29.0.0", tsyringe: "^4.8.0" },
|
||||
};
|
||||
|
||||
const agent = new ProjectResearcherAgent();
|
||||
const summary = agent.categorizeFindings(pkg, {}, []);
|
||||
|
||||
expect(summary.patterns).toContain("test_driven");
|
||||
expect(summary.patterns).toContain("dependency_injection");
|
||||
});
|
||||
|
||||
it("returns empty summary when no package.json exists", () => {
|
||||
const agent = new ProjectResearcherAgent();
|
||||
const summary = agent.mechanicalProjectResearch(tempDir);
|
||||
|
||||
expect(summary.frameworks).toEqual([]);
|
||||
expect(summary.apis).toEqual([]);
|
||||
expect(summary.patterns).toEqual([]);
|
||||
expect(summary.technologyDecisions).toEqual([]);
|
||||
});
|
||||
|
||||
it("agent name is project-researcher", () => {
|
||||
const agent = new ProjectResearcherAgent();
|
||||
expect(agent.name).toBe("project-researcher");
|
||||
});
|
||||
});
|
||||
@@ -1,5 +1,57 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
|
||||
interface EcosystemSummary {
|
||||
frameworks: string[];
|
||||
apis: string[];
|
||||
patterns: string[];
|
||||
tooling: string[];
|
||||
technologyDecisions: Array<{ id: string; decision: string; confidence: number }>;
|
||||
}
|
||||
|
||||
const FRAMEWORK_PATTERNS: Record<string, string[]> = {
|
||||
react: ["react"],
|
||||
vue: ["vue"],
|
||||
angular: ["@angular/core"],
|
||||
svelte: ["svelte"],
|
||||
express: ["express"],
|
||||
fastify: ["fastify"],
|
||||
nestjs: ["@nestjs/core"],
|
||||
next: ["next"],
|
||||
nuxt: ["nuxt"],
|
||||
koa: ["koa"],
|
||||
jest: ["jest"],
|
||||
vitest: ["vitest"],
|
||||
};
|
||||
|
||||
const API_PATTERNS: Record<string, string[]> = {
|
||||
graphql: ["graphql", "apollo", "@apollo"],
|
||||
rest: ["express", "fastify", "restana"],
|
||||
grpc: ["grpc", "@grpc"],
|
||||
websocket: ["ws", "socket.io"],
|
||||
};
|
||||
|
||||
const PATTERN_PATTERNS: Record<string, string[]> = {
|
||||
microservices: ["@nestjs/microservices", "amqplib", "kafkajs"],
|
||||
middleware: ["express", "koa", "fastify"],
|
||||
cqrs: ["@nestjs/cqrs"],
|
||||
dependency_injection: ["inversify", "tsyringe", "@nestjs/core"],
|
||||
test_driven: ["jest", "vitest", "mocha"],
|
||||
};
|
||||
|
||||
const TOOLING_PATTERNS: Record<string, string[]> = {
|
||||
typescript: ["typescript"],
|
||||
eslint: ["eslint"],
|
||||
prettier: ["prettier"],
|
||||
webpack: ["webpack"],
|
||||
vite: ["vite"],
|
||||
rollup: ["rollup"],
|
||||
esbuild: ["esbuild"],
|
||||
docker: [],
|
||||
ci_cd: [],
|
||||
};
|
||||
|
||||
export class ProjectResearcherAgent extends BaseAgent {
|
||||
readonly name = "project-researcher";
|
||||
readonly description = "Researches the domain ecosystem for a new project.";
|
||||
@@ -8,6 +60,7 @@ export class ProjectResearcherAgent extends BaseAgent {
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Researching project domain ecosystem...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
@@ -15,14 +68,203 @@ export class ProjectResearcherAgent extends BaseAgent {
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const summary = this.mechanicalProjectResearch(context.project_path);
|
||||
const output = this.formatSummary(summary);
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Project research requires an intelligence backend.",
|
||||
success: true,
|
||||
output,
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
decisions: summary.technologyDecisions.length,
|
||||
escalations: 0,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
};
|
||||
}
|
||||
|
||||
mechanicalProjectResearch(projectPath: string): EcosystemSummary {
|
||||
const pkg = this.readPackageJson(projectPath);
|
||||
const tsconfig = this.readTsconfig(projectPath);
|
||||
const techDecisions = this.readTechDecisions(projectPath);
|
||||
const summary = this.categorizeFindings(pkg, tsconfig, techDecisions);
|
||||
return summary;
|
||||
}
|
||||
|
||||
readPackageJson(projectPath: string): Record<string, unknown> {
|
||||
const pkgPath = path.join(projectPath, "package.json");
|
||||
if (!fs.existsSync(pkgPath)) return {};
|
||||
try {
|
||||
return JSON.parse(fs.readFileSync(pkgPath, "utf-8"));
|
||||
} catch {
|
||||
return {};
|
||||
}
|
||||
}
|
||||
|
||||
readTsconfig(projectPath: string): Record<string, unknown> {
|
||||
const tsconfigPath = path.join(projectPath, "tsconfig.json");
|
||||
if (!fs.existsSync(tsconfigPath)) return {};
|
||||
try {
|
||||
return JSON.parse(fs.readFileSync(tsconfigPath, "utf-8"));
|
||||
} catch {
|
||||
return {};
|
||||
}
|
||||
}
|
||||
|
||||
readTechDecisions(projectPath: string): Array<{ id: string; decision: string; confidence: number }> {
|
||||
const decisions: Array<{ id: string; decision: string; confidence: number }> = [];
|
||||
const techCategories = ["technology_choice", "implementation_approach", "architecture"];
|
||||
|
||||
try {
|
||||
const { execSync } = require("node:child_process");
|
||||
const logContent = execSync(
|
||||
`git log --all --format="%B" -100`,
|
||||
{ cwd: projectPath, encoding: "utf-8", timeout: 5000 }
|
||||
);
|
||||
|
||||
const categoryRegex = /category:\s*(\S+)/g;
|
||||
const decisionRegex = /decisions:\s*\n((?:\s+-\s+.+\n?)+)/g;
|
||||
let catMatch;
|
||||
let match;
|
||||
|
||||
const blocks: Array<{ categories: string[]; items: string[] }> = [];
|
||||
let currentCategories: string[] = [];
|
||||
|
||||
while ((catMatch = categoryRegex.exec(logContent)) !== null) {
|
||||
currentCategories.push(catMatch[1].toLowerCase());
|
||||
}
|
||||
|
||||
while ((match = decisionRegex.exec(logContent)) !== null) {
|
||||
const items = match[1].split("\n").filter((l: string) => l.trim().startsWith("-"));
|
||||
blocks.push({
|
||||
categories: [...currentCategories],
|
||||
items: items.map((i: string) => i.replace(/^\s*-\s*/, "").trim()),
|
||||
});
|
||||
}
|
||||
|
||||
for (const block of blocks) {
|
||||
const isTech = block.categories.some((c) => techCategories.includes(c));
|
||||
if (!isTech && block.categories.length > 0) continue;
|
||||
|
||||
for (const item of block.items) {
|
||||
const idMatch = item.match(/D-(\d+)/);
|
||||
const id = idMatch ? `D-${idMatch[1]}` : `D-${decisions.length + 1}`;
|
||||
const confMatch = item.match(/confidence[:\s]+(\d+\.?\d*)/);
|
||||
const confidence = confMatch ? parseFloat(confMatch[1]) : 0.5;
|
||||
decisions.push({ id, decision: item, confidence });
|
||||
}
|
||||
}
|
||||
} catch {
|
||||
// git not available or no commits
|
||||
}
|
||||
|
||||
return decisions;
|
||||
}
|
||||
|
||||
categorizeFindings(
|
||||
pkg: Record<string, unknown>,
|
||||
tsconfig: Record<string, unknown>,
|
||||
techDecisions: Array<{ id: string; decision: string; confidence: number }>
|
||||
): EcosystemSummary {
|
||||
const allDeps: string[] = [];
|
||||
const deps = pkg.dependencies as Record<string, string> | undefined;
|
||||
const devDeps = pkg.devDependencies as Record<string, string> | undefined;
|
||||
if (deps) allDeps.push(...Object.keys(deps));
|
||||
if (devDeps) allDeps.push(...Object.keys(devDeps));
|
||||
|
||||
const frameworks: string[] = [];
|
||||
for (const [name, depPatterns] of Object.entries(FRAMEWORK_PATTERNS)) {
|
||||
if (depPatterns.some((p) => allDeps.includes(p))) {
|
||||
frameworks.push(name);
|
||||
}
|
||||
}
|
||||
|
||||
const apis: string[] = [];
|
||||
for (const [name, depPatterns] of Object.entries(API_PATTERNS)) {
|
||||
if (depPatterns.some((p) => allDeps.includes(p))) {
|
||||
apis.push(name);
|
||||
}
|
||||
}
|
||||
|
||||
const patterns: string[] = [];
|
||||
for (const [name, depPatterns] of Object.entries(PATTERN_PATTERNS)) {
|
||||
if (depPatterns.some((p) => allDeps.includes(p))) {
|
||||
patterns.push(name);
|
||||
}
|
||||
}
|
||||
|
||||
const tooling: string[] = [];
|
||||
for (const [name, depPatterns] of Object.entries(TOOLING_PATTERNS)) {
|
||||
if (depPatterns.some((p) => allDeps.includes(p))) {
|
||||
tooling.push(name);
|
||||
}
|
||||
}
|
||||
|
||||
const compilerOptions = tsconfig.compilerOptions as Record<string, unknown> | undefined;
|
||||
if (compilerOptions) {
|
||||
const target = compilerOptions.target as string | undefined;
|
||||
if (target) tooling.push(`es_target:${target.toLowerCase()}`);
|
||||
const module = compilerOptions.module as string | undefined;
|
||||
if (module) tooling.push(`module_system:${module.toLowerCase()}`);
|
||||
}
|
||||
|
||||
const scripts = pkg.scripts as Record<string, string> | undefined;
|
||||
if (scripts) {
|
||||
if (scripts.build) tooling.push("build_script");
|
||||
if (scripts.test) tooling.push("test_script");
|
||||
if (scripts.lint) tooling.push("lint_script");
|
||||
}
|
||||
|
||||
const engines = pkg.engines as Record<string, string> | undefined;
|
||||
if (engines && engines.node) {
|
||||
tooling.push(`node:${engines.node}`);
|
||||
}
|
||||
|
||||
return {
|
||||
frameworks,
|
||||
apis,
|
||||
patterns,
|
||||
tooling,
|
||||
technologyDecisions: techDecisions,
|
||||
};
|
||||
}
|
||||
|
||||
private formatSummary(summary: EcosystemSummary): string {
|
||||
const lines: string[] = ["Ecosystem Summary:", ""];
|
||||
|
||||
lines.push("Frameworks:");
|
||||
for (const f of summary.frameworks) {
|
||||
lines.push(` - ${f}`);
|
||||
}
|
||||
if (summary.frameworks.length === 0) lines.push(" (none detected)");
|
||||
|
||||
lines.push("");
|
||||
lines.push("APIs:");
|
||||
for (const a of summary.apis) {
|
||||
lines.push(` - ${a}`);
|
||||
}
|
||||
if (summary.apis.length === 0) lines.push(" (none detected)");
|
||||
|
||||
lines.push("");
|
||||
lines.push("Patterns:");
|
||||
for (const p of summary.patterns) {
|
||||
lines.push(` - ${p}`);
|
||||
}
|
||||
if (summary.patterns.length === 0) lines.push(" (none detected)");
|
||||
|
||||
lines.push("");
|
||||
lines.push("Tooling:");
|
||||
for (const t of summary.tooling) {
|
||||
lines.push(` - ${t}`);
|
||||
}
|
||||
if (summary.tooling.length === 0) lines.push(" (none detected)");
|
||||
|
||||
lines.push("");
|
||||
lines.push("Technology Decisions:");
|
||||
for (const d of summary.technologyDecisions) {
|
||||
lines.push(` [${d.id}|conf=${d.confidence.toFixed(2)}] ${d.decision}`);
|
||||
}
|
||||
if (summary.technologyDecisions.length === 0) lines.push(" (none found)");
|
||||
|
||||
return lines.join("\n");
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,72 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { ResearchSynthesizerAgent } from "../agents/research-synthesizer.js";
|
||||
|
||||
describe("ResearchSynthesizerAgent", () => {
|
||||
let tempDir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
tempDir = fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-synth-test-"));
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
fs.rmSync(tempDir, { recursive: true, force: true });
|
||||
});
|
||||
|
||||
it("reads project files and extracts findings", () => {
|
||||
const ciagentDir = path.join(tempDir, ".ciagent");
|
||||
fs.mkdirSync(ciagentDir, { recursive: true });
|
||||
fs.writeFileSync(path.join(ciagentDir, "ARCHITECTURE.md"), "# Architecture\n\n- Component A\n- Component B");
|
||||
fs.writeFileSync(path.join(ciagentDir, "REQUIREMENTS.md"), "# Requirements\n\n* REQ-1\n* REQ-2");
|
||||
|
||||
const agent = new ResearchSynthesizerAgent();
|
||||
const findings = agent.mechanicalSynthesize(tempDir);
|
||||
|
||||
expect(findings.length).toBeGreaterThan(0);
|
||||
const sources = findings.map((f) => f.source);
|
||||
expect(sources).toContain("ARCHITECTURE.md");
|
||||
expect(sources).toContain("REQUIREMENTS.md");
|
||||
});
|
||||
|
||||
it("merges overlapping topics from different sources", () => {
|
||||
const ciagentDir = path.join(tempDir, ".ciagent");
|
||||
fs.mkdirSync(ciagentDir, { recursive: true });
|
||||
fs.writeFileSync(path.join(ciagentDir, "ARCHITECTURE.md"), "# Testing Strategy\n\n- Unit tests required");
|
||||
fs.writeFileSync(path.join(ciagentDir, "PROJECT.md"), "# Testing Strategy\n\n- Integration tests needed");
|
||||
|
||||
const agent = new ResearchSynthesizerAgent();
|
||||
const findings = agent.mechanicalSynthesize(tempDir);
|
||||
|
||||
const testingFindings = findings.filter((f) => f.topic.includes("testing strategy"));
|
||||
expect(testingFindings.length).toBeGreaterThanOrEqual(1);
|
||||
const refs = testingFindings[0].crossReferences;
|
||||
expect(refs).toContain("ARCHITECTURE.md");
|
||||
expect(refs).toContain("PROJECT.md");
|
||||
});
|
||||
|
||||
it("adds cross references between findings with shared topics", () => {
|
||||
const ciagentDir = path.join(tempDir, ".ciagent");
|
||||
fs.mkdirSync(ciagentDir, { recursive: true });
|
||||
fs.writeFileSync(path.join(ciagentDir, "ARCHITECTURE.md"), "## API Layer\n\n- REST endpoints");
|
||||
fs.writeFileSync(path.join(ciagentDir, "REQUIREMENTS.md"), "## API Layer\n\n* Authentication");
|
||||
|
||||
const agent = new ResearchSynthesizerAgent();
|
||||
const findings = agent.mechanicalSynthesize(tempDir);
|
||||
|
||||
const apiFindings = findings.filter((f) => f.topic.includes("api layer"));
|
||||
expect(apiFindings.length).toBeGreaterThan(0);
|
||||
});
|
||||
|
||||
it("returns empty findings when no files exist", () => {
|
||||
const agent = new ResearchSynthesizerAgent();
|
||||
const findings = agent.mechanicalSynthesize(tempDir);
|
||||
|
||||
expect(findings).toEqual([]);
|
||||
});
|
||||
|
||||
it("agent name is research-synthesizer", () => {
|
||||
const agent = new ResearchSynthesizerAgent();
|
||||
expect(agent.name).toBe("research-synthesizer");
|
||||
});
|
||||
});
|
||||
@@ -1,5 +1,20 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
|
||||
interface SynthesisFinding {
|
||||
source: "ARCHITECTURE.md" | "REQUIREMENTS.md" | "PROJECT.md" | "git_log";
|
||||
topic: string;
|
||||
summary: string;
|
||||
crossReferences: string[];
|
||||
}
|
||||
|
||||
const SOURCE_FILES: Array<{ file: string; source: SynthesisFinding["source"] }> = [
|
||||
{ file: "ARCHITECTURE.md", source: "ARCHITECTURE.md" },
|
||||
{ file: "REQUIREMENTS.md", source: "REQUIREMENTS.md" },
|
||||
{ file: "PROJECT.md", source: "PROJECT.md" },
|
||||
];
|
||||
|
||||
export class ResearchSynthesizerAgent extends BaseAgent {
|
||||
readonly name = "research-synthesizer";
|
||||
readonly description = "Synthesizes research files into a cohesive summary for roadmap creation.";
|
||||
@@ -8,6 +23,7 @@ export class ResearchSynthesizerAgent extends BaseAgent {
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Synthesizing research...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
@@ -15,14 +31,113 @@ export class ResearchSynthesizerAgent extends BaseAgent {
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const findings = this.mechanicalSynthesize(context.project_path);
|
||||
const output = this.formatFindings(findings);
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Research synthesis requires an intelligence backend.",
|
||||
success: true,
|
||||
output,
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
};
|
||||
}
|
||||
|
||||
mechanicalSynthesize(projectPath: string): SynthesisFinding[] {
|
||||
const fileContents = this.readProjectFiles(projectPath);
|
||||
const allFindings = this.extractKeyStatements(fileContents);
|
||||
const merged = this.mergeOverlapping(allFindings);
|
||||
return this.addCrossReferences(merged);
|
||||
}
|
||||
|
||||
readProjectFiles(projectPath: string): Array<{ source: SynthesisFinding["source"]; content: string }> {
|
||||
const results: Array<{ source: SynthesisFinding["source"]; content: string }> = [];
|
||||
const ciagentDir = path.join(projectPath, ".ciagent");
|
||||
|
||||
for (const { file, source } of SOURCE_FILES) {
|
||||
const filePath = path.join(ciagentDir, file);
|
||||
if (fs.existsSync(filePath)) {
|
||||
results.push({ source, content: fs.readFileSync(filePath, "utf-8") });
|
||||
}
|
||||
}
|
||||
|
||||
return results;
|
||||
}
|
||||
|
||||
extractKeyStatements(fileContents: Array<{ source: SynthesisFinding["source"]; content: string }>): SynthesisFinding[] {
|
||||
const findings: SynthesisFinding[] = [];
|
||||
const topicPatterns = [
|
||||
/(?:^|\n)#{1,3}\s+(.+)/g,
|
||||
/(?:^|\n)\*\s+(.+)/g,
|
||||
/(?:^|\n)-\s+(.{5,80})/g,
|
||||
];
|
||||
|
||||
for (const { source, content } of fileContents) {
|
||||
if (!content.trim()) continue;
|
||||
for (const pattern of topicPatterns) {
|
||||
pattern.lastIndex = 0;
|
||||
let match;
|
||||
while ((match = pattern.exec(content)) !== null) {
|
||||
const topic = match[1].trim().replace(/[*`#]/g, "").substring(0, 80).trim();
|
||||
if (topic.length < 3) continue;
|
||||
findings.push({
|
||||
source,
|
||||
topic: topic.toLowerCase(),
|
||||
summary: topic,
|
||||
crossReferences: [],
|
||||
});
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return findings;
|
||||
}
|
||||
|
||||
mergeOverlapping(findings: SynthesisFinding[]): SynthesisFinding[] {
|
||||
const merged: Map<string, SynthesisFinding> = new Map();
|
||||
for (const finding of findings) {
|
||||
const key = finding.topic;
|
||||
const existing = merged.get(key);
|
||||
if (existing) {
|
||||
if (!existing.crossReferences.includes(finding.source)) {
|
||||
existing.crossReferences.push(finding.source);
|
||||
}
|
||||
} else {
|
||||
merged.set(key, {
|
||||
...finding,
|
||||
crossReferences: [finding.source],
|
||||
});
|
||||
}
|
||||
}
|
||||
return Array.from(merged.values());
|
||||
}
|
||||
|
||||
addCrossReferences(findings: SynthesisFinding[]): SynthesisFinding[] {
|
||||
for (let i = 0; i < findings.length; i++) {
|
||||
for (let j = 0; j < findings.length; j++) {
|
||||
if (i === j) continue;
|
||||
const topicA = findings[i].topic.split(" ").slice(0, 2).join(" ");
|
||||
const topicB = findings[j].topic.split(" ").slice(0, 2).join(" ");
|
||||
if (topicA === topicB && !findings[i].crossReferences.includes(findings[j].source)) {
|
||||
findings[i].crossReferences.push(findings[j].source);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
const crossReferenced = findings.filter((f) => f.crossReferences.length > 1);
|
||||
const standalone = findings.filter((f) => f.crossReferences.length <= 1);
|
||||
return [...crossReferenced, ...standalone];
|
||||
}
|
||||
|
||||
private formatFindings(findings: SynthesisFinding[]): string {
|
||||
if (findings.length === 0) return "No findings synthesized — no project files found.";
|
||||
const lines: string[] = ["Synthesis Findings:", ""];
|
||||
for (const f of findings) {
|
||||
const refs = f.crossReferences.length > 0 ? f.crossReferences.join(", ") : "none";
|
||||
lines.push(`[${f.source}] ${f.summary} (refs: ${refs})`);
|
||||
}
|
||||
return lines.join("\n");
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,208 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { ResearcherAgent } from "../agents/researcher.js";
|
||||
import { AgentContext } from "../agents/base.js";
|
||||
import { IntelligenceBackend, BackendRequest, BackendResult } from "../backends/types.js";
|
||||
import { emptyTokenUsage } from "../backends/types.js";
|
||||
|
||||
class MockBackend implements IntelligenceBackend {
|
||||
readonly name = "mock";
|
||||
readonly type = "llm" as const;
|
||||
async isAvailable(): Promise<boolean> { return true; }
|
||||
async execute(request: BackendRequest): Promise<BackendResult> {
|
||||
return {
|
||||
success: true,
|
||||
output: `Mock backend executed: ${request.task.slice(0, 50)}`,
|
||||
artifacts: [],
|
||||
decisions: [],
|
||||
escalations: [],
|
||||
usage: emptyTokenUsage(),
|
||||
};
|
||||
}
|
||||
}
|
||||
|
||||
function createTempDir(): string {
|
||||
return fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-researcher-test-"));
|
||||
}
|
||||
|
||||
function cleanup(dir: string): void {
|
||||
fs.rmSync(dir, { recursive: true, force: true });
|
||||
}
|
||||
|
||||
function makeContext(dir: string, backend?: IntelligenceBackend): AgentContext {
|
||||
return {
|
||||
project_path: dir,
|
||||
phase: 1,
|
||||
stage: "research",
|
||||
specification: "Build a REST API for task management",
|
||||
config_path: path.join(dir, ".ciagent", "config.json"),
|
||||
backend,
|
||||
};
|
||||
}
|
||||
|
||||
function setupCIAgentDir(dir: string): void {
|
||||
const ciDir = path.join(dir, ".ciagent");
|
||||
fs.mkdirSync(ciDir, { recursive: true });
|
||||
fs.writeFileSync(path.join(ciDir, "config.json"), '{"projects":[],"active_project":""}');
|
||||
}
|
||||
|
||||
function writeProjectMd(dir: string): void {
|
||||
const ciDir = path.join(dir, ".ciagent");
|
||||
const content = [
|
||||
"# Task API",
|
||||
"",
|
||||
"## What This Is",
|
||||
"",
|
||||
"A REST API for managing tasks",
|
||||
"",
|
||||
"## Requirements",
|
||||
"",
|
||||
"### Validated",
|
||||
"",
|
||||
"- ✓ User authentication",
|
||||
"",
|
||||
"### Active",
|
||||
"",
|
||||
"- [ ] Task CRUD",
|
||||
"",
|
||||
"### Out of Scope",
|
||||
"",
|
||||
"- Admin dashboard",
|
||||
"",
|
||||
"## Context",
|
||||
"",
|
||||
"Node.js project",
|
||||
"",
|
||||
"## Constraints",
|
||||
"",
|
||||
"- Must use Node.js",
|
||||
"",
|
||||
"## Key Decisions",
|
||||
"",
|
||||
"| Decision | Rationale | Outcome |",
|
||||
"|----------|-----------|---------|",
|
||||
].join("\n");
|
||||
fs.writeFileSync(path.join(ciDir, "PROJECT.md"), content);
|
||||
}
|
||||
|
||||
function writeArchitectureMd(dir: string): void {
|
||||
const ciDir = path.join(dir, ".ciagent");
|
||||
const content = [
|
||||
"# Architecture",
|
||||
"",
|
||||
"## Overview",
|
||||
"",
|
||||
"Task management system architecture",
|
||||
"",
|
||||
"## Components",
|
||||
"",
|
||||
"### Core",
|
||||
"- **Description**: Core module",
|
||||
"- **Boundaries**: src/core/ — internal module",
|
||||
"- **Depends on**: None",
|
||||
"",
|
||||
"## Data Flow",
|
||||
"",
|
||||
"Request → Handler → Service → Database",
|
||||
"",
|
||||
"## Build Order",
|
||||
"",
|
||||
"1. Build core module",
|
||||
].join("\n");
|
||||
fs.writeFileSync(path.join(ciDir, "ARCHITECTURE.md"), content);
|
||||
}
|
||||
|
||||
function setupSourceDir(dir: string): void {
|
||||
const srcDir = path.join(dir, "src");
|
||||
fs.mkdirSync(srcDir, { recursive: true });
|
||||
fs.mkdirSync(path.join(srcDir, "core"), { recursive: true });
|
||||
fs.mkdirSync(path.join(srcDir, "agents"), { recursive: true });
|
||||
fs.writeFileSync(path.join(srcDir, "core", "index.ts"), "export {};\n");
|
||||
fs.writeFileSync(path.join(srcDir, "agents", "base.ts"), "export {};\n");
|
||||
}
|
||||
|
||||
describe("ResearcherAgent", () => {
|
||||
let dir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
dir = createTempDir();
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
cleanup(dir);
|
||||
});
|
||||
|
||||
it("reads .ciagent/ files without backend", async () => {
|
||||
setupCIAgentDir(dir);
|
||||
writeProjectMd(dir);
|
||||
writeArchitectureMd(dir);
|
||||
|
||||
const researcher = new ResearcherAgent();
|
||||
const result = await researcher.execute(makeContext(dir));
|
||||
expect(result.success).toBe(true);
|
||||
expect(result.output).toContain("findingsCount");
|
||||
});
|
||||
|
||||
it("only modifies .ciagent/ files", async () => {
|
||||
setupCIAgentDir(dir);
|
||||
writeProjectMd(dir);
|
||||
writeArchitectureMd(dir);
|
||||
setupSourceDir(dir);
|
||||
|
||||
const srcDir = path.join(dir, "src");
|
||||
const filesBefore = new Set<string>();
|
||||
function collectFiles(d: string): void {
|
||||
for (const entry of fs.readdirSync(d, { withFileTypes: true })) {
|
||||
const full = path.join(d, entry.name);
|
||||
if (entry.isDirectory() && entry.name !== "node_modules") {
|
||||
collectFiles(full);
|
||||
} else {
|
||||
filesBefore.add(full);
|
||||
}
|
||||
}
|
||||
}
|
||||
collectFiles(srcDir);
|
||||
|
||||
const researcher = new ResearcherAgent();
|
||||
await researcher.execute(makeContext(dir));
|
||||
|
||||
collectFiles(srcDir);
|
||||
for (const f of filesBefore) {
|
||||
expect(fs.existsSync(f)).toBe(true);
|
||||
}
|
||||
});
|
||||
|
||||
it("updates ARCHITECTURE.md from source scan", async () => {
|
||||
setupCIAgentDir(dir);
|
||||
writeProjectMd(dir);
|
||||
setupSourceDir(dir);
|
||||
|
||||
const researcher = new ResearcherAgent();
|
||||
const result = await researcher.execute(makeContext(dir));
|
||||
|
||||
if (result.success) {
|
||||
const parsed = JSON.parse(result.output);
|
||||
expect(parsed.filesUpdated).toContain(".ciagent/ARCHITECTURE.md");
|
||||
}
|
||||
});
|
||||
|
||||
it("delegates to backend when available", async () => {
|
||||
setupCIAgentDir(dir);
|
||||
const mockBackend = new MockBackend();
|
||||
const researcher = new ResearcherAgent();
|
||||
const result = await researcher.execute(makeContext(dir, mockBackend));
|
||||
expect(result.success).toBe(true);
|
||||
expect(result.output).toContain("Mock backend executed");
|
||||
});
|
||||
|
||||
it("has correct agent name", () => {
|
||||
const researcher = new ResearcherAgent();
|
||||
expect(researcher.name).toBe("researcher");
|
||||
});
|
||||
|
||||
it("has correct workflow", () => {
|
||||
const researcher = new ResearcherAgent();
|
||||
expect(researcher.workflow).toBe("research");
|
||||
});
|
||||
});
|
||||
+240
-6
@@ -1,4 +1,20 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
import { GitContext } from "../core/git-context.js";
|
||||
import { CIAgentFiles, ArchitectureMd, ProjectMd } from "../core/ciagent-files.js";
|
||||
import { CommitBuilder } from "../core/commit-builder.js";
|
||||
import { CommitDecision } from "../types/commit-meta.js";
|
||||
import { fileExists, readFile } from "../utils/file.js";
|
||||
import { execSync } from "node:child_process";
|
||||
|
||||
export interface ResearcherResult {
|
||||
success: boolean;
|
||||
findingsCount: number;
|
||||
decisionsLogged: number;
|
||||
filesUpdated: string[];
|
||||
error?: string;
|
||||
}
|
||||
|
||||
export class ResearcherAgent extends BaseAgent {
|
||||
readonly name = "researcher";
|
||||
@@ -8,21 +24,239 @@ export class ResearcherAgent extends BaseAgent {
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Researching domain...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
`Research the domain for: ${context.specification}`
|
||||
`Research the domain for phase ${context.phase}. Specification: ${context.specification}. Read git history (last 50 commits), .ciagent/PROJECT.md, .ciagent/ARCHITECTURE.md, .ciagent/REQUIREMENTS.md. Scan src/ directory structure. Generate findings about module boundaries, risks, and approach. Update .ciagent/ARCHITECTURE.md with component boundary conclusions. Update .ciagent/PROJECT.md key decisions if warranted. Commit findings with CommitBuilder.buildResearchCommit().`
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const result = await this.runMechanicalResearch(context);
|
||||
const output = JSON.stringify(result, null, 2);
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Research requires an intelligence backend. Configure one with: ci init --backend",
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
success: result.success,
|
||||
output,
|
||||
artifacts_created: result.filesUpdated,
|
||||
decisions: result.decisionsLogged,
|
||||
escalations: 0,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
error: result.error,
|
||||
};
|
||||
}
|
||||
|
||||
private async runMechanicalResearch(context: AgentContext): Promise<ResearcherResult> {
|
||||
try {
|
||||
const gitContext = new GitContext(context.project_path);
|
||||
const ciFiles = new CIAgentFiles(context.project_path);
|
||||
|
||||
const findings: string[] = [];
|
||||
const decisions: CommitDecision[] = [];
|
||||
const filesUpdated: string[] = [];
|
||||
|
||||
const commits = gitContext.getRecentCommits(50);
|
||||
if (commits.length > 0) {
|
||||
findings.push(`Analyzed ${commits.length} recent commits for project history`);
|
||||
const researchCommits = commits.filter(c => c.ci?.status === "research");
|
||||
if (researchCommits.length > 0) {
|
||||
findings.push(`Found ${researchCommits.length} prior research commits`);
|
||||
}
|
||||
}
|
||||
|
||||
const projectMd = ciFiles.readProjectMd();
|
||||
if (projectMd) {
|
||||
findings.push(`Project: ${projectMd.name} — core value: ${projectMd.coreValue.slice(0, 80)}`);
|
||||
findings.push(`Active requirements: ${projectMd.requirements.active.length}, validated: ${projectMd.requirements.validated.length}`);
|
||||
} else {
|
||||
findings.push("No PROJECT.md found — project context unavailable");
|
||||
}
|
||||
|
||||
const archMd = ciFiles.readArchitectureMd();
|
||||
if (archMd) {
|
||||
findings.push(`Architecture: ${archMd.components.length} components, ${archMd.buildOrder.length} build steps`);
|
||||
for (const comp of archMd.components) {
|
||||
findings.push(` Component: ${comp.name} — boundaries: ${comp.boundaries.slice(0, 60)}, deps: ${comp.dependsOn.join(", ") || "none"}`);
|
||||
}
|
||||
} else {
|
||||
findings.push("No ARCHITECTURE.md found — architecture analysis unavailable");
|
||||
}
|
||||
|
||||
const reqsMd = ciFiles.readRequirementsMd();
|
||||
if (reqsMd) {
|
||||
const totalReqs = reqsMd.traceability.length;
|
||||
const covered = reqsMd.traceability.filter(t => t.status === "complete").length;
|
||||
const phaseReqs = reqsMd.traceability.filter(t => t.phase === context.phase);
|
||||
findings.push(`Requirements: ${totalReqs} total, ${covered} complete, ${phaseReqs.length} for phase ${context.phase}`);
|
||||
}
|
||||
|
||||
const srcDir = path.join(context.project_path, "src");
|
||||
if (fs.existsSync(srcDir)) {
|
||||
const moduleDirs = fs.readdirSync(srcDir, { withFileTypes: true })
|
||||
.filter(d => d.isDirectory() && d.name !== "node_modules")
|
||||
.map(d => d.name);
|
||||
findings.push(`Source modules: ${moduleDirs.join(", ")}`);
|
||||
|
||||
const updatedArch = this.deriveArchitectureFromSource(srcDir, archMd, moduleDirs);
|
||||
if (updatedArch) {
|
||||
ciFiles.writeArchitectureMd(updatedArch);
|
||||
filesUpdated.push(".ciagent/ARCHITECTURE.md");
|
||||
findings.push("Updated ARCHITECTURE.md with source-derived component boundaries");
|
||||
|
||||
decisions.push({
|
||||
id: `D-P${context.phase}-001`,
|
||||
decision: "Updated component boundaries from source scan",
|
||||
rationale: "Source directory structure reveals actual module boundaries",
|
||||
confidence: 0.75,
|
||||
alternatives: ["manual architecture review", "no update"],
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
if (projectMd && archMd) {
|
||||
const updatedProject = this.maybeUpdateKeyDecisions(projectMd, findings);
|
||||
if (updatedProject) {
|
||||
ciFiles.writeProjectMd(updatedProject, "research findings update");
|
||||
filesUpdated.push(".ciagent/PROJECT.md");
|
||||
findings.push("Updated PROJECT.md key decisions from research");
|
||||
|
||||
decisions.push({
|
||||
id: `D-P${context.phase}-002`,
|
||||
decision: "Logged research-based decisions to PROJECT.md",
|
||||
rationale: "Research findings warrant recording as key decisions",
|
||||
confidence: 0.70,
|
||||
alternatives: ["defer decision logging", "log after execution"],
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
this.commitFindings(context, findings, decisions);
|
||||
|
||||
return {
|
||||
success: true,
|
||||
findingsCount: findings.length,
|
||||
decisionsLogged: decisions.length,
|
||||
filesUpdated,
|
||||
};
|
||||
} catch (err) {
|
||||
return {
|
||||
success: false,
|
||||
findingsCount: 0,
|
||||
decisionsLogged: 0,
|
||||
filesUpdated: [],
|
||||
error: `Research failed: ${err instanceof Error ? err.message : String(err)}`,
|
||||
};
|
||||
}
|
||||
}
|
||||
|
||||
private deriveArchitectureFromSource(srcDir: string, existing: ArchitectureMd | null, moduleDirs: string[]): ArchitectureMd | null {
|
||||
const newComponents = moduleDirs.map(dir => {
|
||||
const dirPath = path.join(srcDir, dir);
|
||||
const fileCount = this.countTsFiles(dirPath);
|
||||
const existingComp = existing?.components.find(c => c.name.toLowerCase() === dir.toLowerCase());
|
||||
|
||||
return {
|
||||
name: existingComp?.name || this.capitalize(dir),
|
||||
description: existingComp?.description || `${dir} module with ${fileCount} source files`,
|
||||
boundaries: existingComp?.boundaries || `src/${dir}/ — ${fileCount} files, internal module`,
|
||||
dependsOn: existingComp?.dependsOn || [],
|
||||
};
|
||||
});
|
||||
|
||||
if (existing) {
|
||||
const existingNames = new Set(existing.components.map(c => c.name.toLowerCase()));
|
||||
const hasNew = newComponents.some(c => !existingNames.has(c.name.toLowerCase()));
|
||||
if (!hasNew) {
|
||||
return {
|
||||
...existing,
|
||||
components: existing.components.map(comp => {
|
||||
const updated = newComponents.find(n => n.name.toLowerCase() === comp.name.toLowerCase());
|
||||
return updated || comp;
|
||||
}),
|
||||
};
|
||||
}
|
||||
|
||||
const merged = [...existing.components];
|
||||
for (const nc of newComponents) {
|
||||
if (!existingNames.has(nc.name.toLowerCase())) {
|
||||
merged.push(nc);
|
||||
}
|
||||
}
|
||||
return { ...existing, components: merged };
|
||||
}
|
||||
|
||||
return {
|
||||
overview: "Architecture derived from source directory scan",
|
||||
components: newComponents,
|
||||
dataFlow: "Modules communicate via typed interfaces and shared utilities",
|
||||
buildOrder: moduleDirs.map(d => `Build ${d} module`),
|
||||
};
|
||||
}
|
||||
|
||||
private maybeUpdateKeyDecisions(projectMd: ProjectMd, findings: string[]): ProjectMd | null {
|
||||
const researchDecisions = findings
|
||||
.filter(f => f.includes("Updated") || f.includes("Found") || f.includes("derived"))
|
||||
.map(f => ({
|
||||
decision: f.slice(0, 50),
|
||||
rationale: "Derived from mechanical source analysis",
|
||||
outcome: "logged by researcher",
|
||||
}));
|
||||
|
||||
if (researchDecisions.length === 0) return null;
|
||||
|
||||
const existingDecisions = projectMd.keyDecisions || [];
|
||||
const existingDecisionTexts = new Set(existingDecisions.map(d => d.decision));
|
||||
|
||||
const novelDecisions = researchDecisions.filter(d => !existingDecisionTexts.has(d.decision));
|
||||
if (novelDecisions.length === 0) return null;
|
||||
|
||||
return {
|
||||
...projectMd,
|
||||
keyDecisions: [...existingDecisions, ...novelDecisions],
|
||||
};
|
||||
}
|
||||
|
||||
private commitFindings(context: AgentContext, findings: string[], decisions: CommitDecision[]): void {
|
||||
try {
|
||||
const gitContext = new GitContext(context.project_path);
|
||||
const projectState = gitContext.reconstructState();
|
||||
const milestone = projectState.currentMilestone || "v1.0";
|
||||
|
||||
const commitMsg = CommitBuilder.buildResearchCommit(
|
||||
context.phase,
|
||||
milestone,
|
||||
`phase ${context.phase} domain research`,
|
||||
findings,
|
||||
decisions.length > 0 ? decisions : undefined,
|
||||
);
|
||||
|
||||
if (fileExists(path.join(context.project_path, ".git"))) {
|
||||
execSync(`git add -A && git commit -m "${commitMsg.replace(/"/g, '\\"')}" --allow-empty`, {
|
||||
cwd: context.project_path,
|
||||
stdio: "pipe",
|
||||
});
|
||||
}
|
||||
} catch (err) {
|
||||
this.warn(`Research commit failed: ${err instanceof Error ? err.message : String(err)}`);
|
||||
}
|
||||
}
|
||||
|
||||
private countTsFiles(dir: string): number {
|
||||
if (!fs.existsSync(dir)) return 0;
|
||||
let count = 0;
|
||||
const entries = fs.readdirSync(dir, { withFileTypes: true });
|
||||
for (const entry of entries) {
|
||||
if (entry.isDirectory() && entry.name !== "node_modules") {
|
||||
count += this.countTsFiles(path.join(dir, entry.name));
|
||||
} else if (entry.name.endsWith(".ts") && !entry.name.endsWith(".d.ts") && !entry.name.endsWith(".test.ts")) {
|
||||
count++;
|
||||
}
|
||||
}
|
||||
return count;
|
||||
}
|
||||
|
||||
private capitalize(s: string): string {
|
||||
return s.split("-").map(p => p.charAt(0).toUpperCase() + p.slice(1)).join("-");
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,77 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { RoadmapperAgent } from "../agents/roadmapper.js";
|
||||
|
||||
describe("RoadmapperAgent", () => {
|
||||
let tempDir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
tempDir = fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-roadmapper-test-"));
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
fs.rmSync(tempDir, { recursive: true, force: true });
|
||||
});
|
||||
|
||||
it("generates phases from REQUIREMENTS.md", () => {
|
||||
const ciagentDir = path.join(tempDir, ".ciagent");
|
||||
fs.mkdirSync(ciagentDir, { recursive: true });
|
||||
fs.writeFileSync(
|
||||
path.join(ciagentDir, "REQUIREMENTS.md"),
|
||||
"REQ-1: Phase: 1 — Build core\nREQ-2: Phase: 1 — Build utils\nREQ-3: Phase: 2 — Add features"
|
||||
);
|
||||
|
||||
const agent = new RoadmapperAgent();
|
||||
const phases = agent.mechanicalRoadmapGenerate(tempDir);
|
||||
|
||||
expect(phases.length).toBeGreaterThanOrEqual(2);
|
||||
expect(phases[0].requirements).toContain("REQ-1");
|
||||
expect(phases[0].requirements).toContain("REQ-2");
|
||||
expect(phases[1].requirements).toContain("REQ-3");
|
||||
});
|
||||
|
||||
it("sets phase dependencies correctly", () => {
|
||||
const ciagentDir = path.join(tempDir, ".ciagent");
|
||||
fs.mkdirSync(ciagentDir, { recursive: true });
|
||||
fs.writeFileSync(
|
||||
path.join(ciagentDir, "REQUIREMENTS.md"),
|
||||
"REQ-1: Phase: 1 — Core\nREQ-2: Phase: 2 — Extension"
|
||||
);
|
||||
|
||||
const agent = new RoadmapperAgent();
|
||||
const phases = agent.mechanicalRoadmapGenerate(tempDir);
|
||||
|
||||
expect(phases.length).toBe(2);
|
||||
expect(phases[0].dependencies).toEqual([]);
|
||||
expect(phases[1].dependencies).toEqual([1]);
|
||||
});
|
||||
|
||||
it("generates success criteria from requirements", () => {
|
||||
const ciagentDir = path.join(tempDir, ".ciagent");
|
||||
fs.mkdirSync(ciagentDir, { recursive: true });
|
||||
fs.writeFileSync(
|
||||
path.join(ciagentDir, "REQUIREMENTS.md"),
|
||||
"REQ-1: Phase: 1 — Build core"
|
||||
);
|
||||
|
||||
const agent = new RoadmapperAgent();
|
||||
const phases = agent.mechanicalRoadmapGenerate(tempDir);
|
||||
|
||||
expect(phases.length).toBe(1);
|
||||
expect(phases[0].successCriteria.length).toBeGreaterThan(0);
|
||||
expect(phases[0].successCriteria.some((c) => c.includes("REQ-1"))).toBe(true);
|
||||
});
|
||||
|
||||
it("returns empty when no REQUIREMENTS.md exists", () => {
|
||||
const agent = new RoadmapperAgent();
|
||||
const phases = agent.mechanicalRoadmapGenerate(tempDir);
|
||||
|
||||
expect(phases).toEqual([]);
|
||||
});
|
||||
|
||||
it("agent name is roadmapper", () => {
|
||||
const agent = new RoadmapperAgent();
|
||||
expect(agent.name).toBe("roadmapper");
|
||||
});
|
||||
});
|
||||
+110
-3
@@ -1,5 +1,16 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
|
||||
interface PhaseDefinition {
|
||||
number: number;
|
||||
name: string;
|
||||
description: string;
|
||||
requirements: string[];
|
||||
dependencies: number[];
|
||||
successCriteria: string[];
|
||||
}
|
||||
|
||||
export class RoadmapperAgent extends BaseAgent {
|
||||
readonly name = "roadmapper";
|
||||
readonly description = "Creates and maintains project roadmaps.";
|
||||
@@ -8,6 +19,7 @@ export class RoadmapperAgent extends BaseAgent {
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Creating roadmap...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
@@ -15,14 +27,109 @@ export class RoadmapperAgent extends BaseAgent {
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const phases = this.mechanicalRoadmapGenerate(context.project_path);
|
||||
const output = this.formatPhases(phases);
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Roadmap creation requires an intelligence backend.",
|
||||
success: true,
|
||||
output,
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
};
|
||||
}
|
||||
|
||||
mechanicalRoadmapGenerate(projectPath: string): PhaseDefinition[] {
|
||||
const requirements = this.readRequirements(projectPath);
|
||||
const grouped = this.groupRequirementsByPhase(requirements);
|
||||
const phases = this.assignPhases(grouped);
|
||||
return phases.map((phase) => ({
|
||||
...phase,
|
||||
successCriteria: this.generateSuccessCriteria(phase),
|
||||
}));
|
||||
}
|
||||
|
||||
readRequirements(projectPath: string): Array<{ id: string; phase: number; text: string }> {
|
||||
const reqPath = path.join(projectPath, ".ciagent", "REQUIREMENTS.md");
|
||||
if (!fs.existsSync(reqPath)) return [];
|
||||
|
||||
const content = fs.readFileSync(reqPath, "utf-8");
|
||||
const requirements: Array<{ id: string; phase: number; text: string }> = [];
|
||||
|
||||
const reqBlockRegex = /REQ-(\d+)[^]*?(?=REQ-\d+|$)/g;
|
||||
let match;
|
||||
while ((match = reqBlockRegex.exec(content)) !== null) {
|
||||
const block = match[0];
|
||||
const id = `REQ-${match[1]}`;
|
||||
const phaseMatch = block.match(/phase[:\s]+(\d+)/i);
|
||||
const phase = phaseMatch ? parseInt(phaseMatch[1], 10) : 1;
|
||||
const textMatch = block.match(/(?:title|description|requirement)[:\s]+(.+)/i);
|
||||
const text = textMatch ? textMatch[1].trim() : id;
|
||||
requirements.push({ id, phase, text });
|
||||
}
|
||||
|
||||
return requirements;
|
||||
}
|
||||
|
||||
groupRequirementsByPhase(requirements: Array<{ id: string; phase: number; text: string }>): Record<number, Array<{ id: string; text: string }>> {
|
||||
const groups: Record<number, Array<{ id: string; text: string }>> = {};
|
||||
for (const req of requirements) {
|
||||
if (!groups[req.phase]) {
|
||||
groups[req.phase] = [];
|
||||
}
|
||||
groups[req.phase].push({ id: req.id, text: req.text });
|
||||
}
|
||||
return groups;
|
||||
}
|
||||
|
||||
assignPhases(grouped: Record<number, Array<{ id: string; text: string }>>): PhaseDefinition[] {
|
||||
const phaseNumbers = Object.keys(grouped).map(Number).sort((a, b) => a - b);
|
||||
if (phaseNumbers.length === 0) return [];
|
||||
|
||||
return phaseNumbers.map((num, idx) => {
|
||||
const reqs = grouped[num];
|
||||
const dependencies = idx === 0 ? [] : [phaseNumbers[idx - 1]];
|
||||
return {
|
||||
number: num,
|
||||
name: `Phase ${num}`,
|
||||
description: `Implementation phase ${num} covering ${reqs.length} requirement(s).`,
|
||||
requirements: reqs.map((r) => r.id),
|
||||
dependencies,
|
||||
successCriteria: [],
|
||||
};
|
||||
});
|
||||
}
|
||||
|
||||
generateSuccessCriteria(phase: PhaseDefinition): string[] {
|
||||
const criteria: string[] = [];
|
||||
for (const reqId of phase.requirements) {
|
||||
criteria.push(`${reqId} fully implemented and verified`);
|
||||
}
|
||||
if (phase.requirements.length > 0) {
|
||||
criteria.push("All tests passing for phase requirements");
|
||||
}
|
||||
if (phase.dependencies.length > 0) {
|
||||
criteria.push(`Phase ${phase.dependencies[0]} completion confirmed`);
|
||||
}
|
||||
return criteria;
|
||||
}
|
||||
|
||||
private formatPhases(phases: PhaseDefinition[]): string {
|
||||
if (phases.length === 0) return "No phases generated — no requirements found.";
|
||||
const lines: string[] = ["Roadmap:", ""];
|
||||
for (const phase of phases) {
|
||||
lines.push(`Phase ${phase.number}: ${phase.name}`);
|
||||
lines.push(` Description: ${phase.description}`);
|
||||
lines.push(` Requirements: ${phase.requirements.join(", ") || "none"}`);
|
||||
lines.push(` Dependencies: ${phase.dependencies.map(String).join(", ") || "none"}`);
|
||||
lines.push(` Success Criteria:`);
|
||||
for (const criterion of phase.successCriteria) {
|
||||
lines.push(` - ${criterion}`);
|
||||
}
|
||||
lines.push("");
|
||||
}
|
||||
return lines.join("\n");
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,69 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { SecurityAuditorAgent } from "../agents/security-auditor.js";
|
||||
|
||||
describe("SecurityAuditorAgent", () => {
|
||||
let tempDir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
tempDir = fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-sec-auditor-test-"));
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
fs.rmSync(tempDir, { recursive: true, force: true });
|
||||
});
|
||||
|
||||
it("finds hardcoded passwords via mechanical audit", () => {
|
||||
const srcDir = path.join(tempDir, "src");
|
||||
fs.mkdirSync(srcDir, { recursive: true });
|
||||
fs.writeFileSync(path.join(srcDir, "config.ts"), 'const password = "secret123";');
|
||||
|
||||
const agent = new SecurityAuditorAgent();
|
||||
const findings = agent.mechanicalAudit(tempDir);
|
||||
|
||||
expect(findings.length).toBeGreaterThan(0);
|
||||
expect(findings[0].stride_category).toBe("information_disclosure");
|
||||
expect(findings[0].cwe).toContain("CWE-");
|
||||
expect(findings[0].severity).toBe("high");
|
||||
});
|
||||
|
||||
it("finds empty catch blocks as repudiation", () => {
|
||||
const srcDir = path.join(tempDir, "src");
|
||||
fs.mkdirSync(srcDir, { recursive: true });
|
||||
fs.writeFileSync(path.join(srcDir, "err.ts"), 'try { work(); } catch(e) {}');
|
||||
|
||||
const agent = new SecurityAuditorAgent();
|
||||
const findings = agent.mechanicalAudit(tempDir);
|
||||
|
||||
const repudiation = findings.filter((f) => f.stride_category === "repudiation");
|
||||
expect(repudiation.length).toBeGreaterThan(0);
|
||||
});
|
||||
|
||||
it("returns empty findings for clean code", () => {
|
||||
const srcDir = path.join(tempDir, "src");
|
||||
fs.mkdirSync(srcDir, { recursive: true });
|
||||
fs.writeFileSync(path.join(srcDir, "app.ts"), 'export function main() { return 1; }');
|
||||
|
||||
const agent = new SecurityAuditorAgent();
|
||||
const findings = agent.mechanicalAudit(tempDir);
|
||||
|
||||
expect(findings).toHaveLength(0);
|
||||
});
|
||||
|
||||
it("applies confidence-based disposition", () => {
|
||||
const srcDir = path.join(tempDir, "src");
|
||||
fs.mkdirSync(srcDir, { recursive: true });
|
||||
fs.writeFileSync(path.join(srcDir, "api.ts"), 'const api_key = "abc123";');
|
||||
|
||||
const agent = new SecurityAuditorAgent(0.5);
|
||||
const findings = agent.mechanicalAudit(tempDir);
|
||||
|
||||
expect(findings.some((f) => f.disposition === "flag")).toBe(true);
|
||||
});
|
||||
|
||||
it("agent name is security-auditor", () => {
|
||||
const agent = new SecurityAuditorAgent();
|
||||
expect(agent.name).toBe("security-auditor");
|
||||
});
|
||||
});
|
||||
@@ -1,13 +1,52 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
|
||||
interface SecurityFinding {
|
||||
stride_category: string;
|
||||
cwe: string;
|
||||
severity: "low" | "medium" | "high";
|
||||
disposition: "accept" | "mitigate" | "flag";
|
||||
file: string;
|
||||
description: string;
|
||||
}
|
||||
|
||||
const SECURITY_PATTERNS: Array<{
|
||||
pattern: RegExp;
|
||||
category: string;
|
||||
cwe: string;
|
||||
description: string;
|
||||
severity: "low" | "medium" | "high";
|
||||
confidence: number;
|
||||
}> = [
|
||||
{ pattern: /password\s*=\s*['"][^'"]+['"]/gi, category: "information_disclosure", cwe: "CWE-259", description: "Hardcoded password", severity: "high", confidence: 0.95 },
|
||||
{ pattern: /api[_-]?key\s*=\s*['"][^'"]+['"]/gi, category: "information_disclosure", cwe: "CWE-312", description: "Hardcoded API key", severity: "high", confidence: 0.95 },
|
||||
{ pattern: /secret\s*=\s*['"][^'"]+['"]/gi, category: "information_disclosure", cwe: "CWE-312", description: "Hardcoded secret", severity: "high", confidence: 0.95 },
|
||||
{ pattern: /token\s*=\s*['"][^'"]+['"]/gi, category: "information_disclosure", cwe: "CWE-312", description: "Hardcoded token", severity: "medium", confidence: 0.80 },
|
||||
{ pattern: /eval\s*\(\s*[^'"]*\$\{/g, category: "tampering", cwe: "CWE-94", description: "eval() with dynamic content", severity: "high", confidence: 0.90 },
|
||||
{ pattern: /(?:exec|execSync|spawn|spawnSync)\s*\(\s*[^'"]*[\$`]/g, category: "elevation_of_privilege", cwe: "CWE-78", description: "Command execution with interpolation", severity: "high", confidence: 0.85 },
|
||||
{ pattern: /catch\s*\(\w*\)\s*\{\s*\}/g, category: "repudiation", cwe: "CWE-778", description: "Empty catch block", severity: "medium", confidence: 0.85 },
|
||||
{ pattern: /jwt\.decode\s*\(/g, category: "spoofing", cwe: "CWE-287", description: "JWT decode without verify", severity: "high", confidence: 0.85 },
|
||||
{ pattern: /(?:__proto__|constructor\s*\[|prototype\s*\[)/g, category: "elevation_of_privilege", cwe: "CWE-1321", description: "Prototype pollution", severity: "high", confidence: 0.90 },
|
||||
{ pattern: /(?:md5|sha1|des|rc4)\s*\(/gi, category: "information_disclosure", cwe: "CWE-328", description: "Weak crypto", severity: "medium", confidence: 0.90 },
|
||||
{ pattern: /express\.json\s*\(\s*\)/g, category: "denial_of_service", cwe: "CWE-400", description: "JSON parser without size limit", severity: "medium", confidence: 0.80 },
|
||||
];
|
||||
|
||||
export class SecurityAuditorAgent extends BaseAgent {
|
||||
readonly name = "security-auditor";
|
||||
readonly description = "Auto-dispositions threats: low=accept, medium=mitigate, high=escalate.";
|
||||
readonly workflow = "verify";
|
||||
private confidenceThreshold: number;
|
||||
|
||||
constructor(confidenceThreshold: number = 0.6) {
|
||||
super();
|
||||
this.confidenceThreshold = confidenceThreshold;
|
||||
}
|
||||
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Running security audit...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
@@ -15,14 +54,74 @@ export class SecurityAuditorAgent extends BaseAgent {
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const findings = this.mechanicalAudit(context.project_path);
|
||||
const highCount = findings.filter((f) => f.severity === "high").length;
|
||||
const output = this.formatFindings(findings);
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Security auditing requires an intelligence backend. Configure one with: ci init --backend",
|
||||
success: highCount === 0,
|
||||
output,
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
escalations: highCount,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
error: highCount > 0 ? `${highCount} high-severity finding(s) require escalation` : undefined,
|
||||
};
|
||||
}
|
||||
|
||||
mechanicalAudit(projectPath: string): SecurityFinding[] {
|
||||
const findings: SecurityFinding[] = [];
|
||||
const srcDir = path.join(projectPath, "src");
|
||||
|
||||
if (!fs.existsSync(srcDir)) return findings;
|
||||
|
||||
this.scanDirectory(srcDir, projectPath, findings);
|
||||
return findings;
|
||||
}
|
||||
|
||||
private getDisposition(severity: SecurityFinding["severity"], confidence: number): SecurityFinding["disposition"] {
|
||||
if (severity === "low") return "accept";
|
||||
if (confidence >= this.confidenceThreshold) return "flag";
|
||||
return "mitigate";
|
||||
}
|
||||
|
||||
private scanDirectory(dir: string, projectPath: string, findings: SecurityFinding[]): void {
|
||||
const entries = fs.readdirSync(dir, { withFileTypes: true });
|
||||
for (const entry of entries) {
|
||||
const fullPath = path.join(dir, entry.name);
|
||||
if (entry.isDirectory() && entry.name !== "node_modules" && entry.name !== ".git") {
|
||||
this.scanDirectory(fullPath, projectPath, findings);
|
||||
} else if (
|
||||
entry.isFile() &&
|
||||
(entry.name.endsWith(".ts") || entry.name.endsWith(".js")) &&
|
||||
!entry.name.endsWith(".test.ts") &&
|
||||
!entry.name.endsWith(".d.ts")
|
||||
) {
|
||||
const content = fs.readFileSync(fullPath, "utf-8");
|
||||
for (const { pattern, category, cwe, description, severity, confidence } of SECURITY_PATTERNS) {
|
||||
pattern.lastIndex = 0;
|
||||
if (pattern.test(content)) {
|
||||
findings.push({
|
||||
stride_category: category,
|
||||
cwe,
|
||||
severity,
|
||||
disposition: this.getDisposition(severity, confidence),
|
||||
file: path.relative(projectPath, fullPath),
|
||||
description,
|
||||
});
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
private formatFindings(findings: SecurityFinding[]): string {
|
||||
if (findings.length === 0) return "No security findings — audit passed.";
|
||||
const lines: string[] = ["Security Audit Findings:", ""];
|
||||
for (const f of findings) {
|
||||
lines.push(`[${f.stride_category}|${f.cwe}|${f.disposition}] ${f.severity.toUpperCase()}: ${f.description} (${f.file})`);
|
||||
}
|
||||
return lines.join("\n");
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,89 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { SolutionWriterAgent } from "../agents/solution-writer.js";
|
||||
|
||||
describe("SolutionWriterAgent", () => {
|
||||
let tempDir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
tempDir = fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-solution-writer-test-"));
|
||||
fs.mkdirSync(path.join(tempDir, ".ciagent"), { recursive: true });
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
fs.rmSync(tempDir, { recursive: true, force: true });
|
||||
});
|
||||
|
||||
it("reads PLAN.md and produces implementation plan section", () => {
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, ".ciagent", "PLAN.md"),
|
||||
"# Plan\n\n| T-01 | Setup | 1 | none | Files exist | REQ-01 |\n|-----|-------|---|------|------------|--------|\n"
|
||||
);
|
||||
|
||||
const agent = new SolutionWriterAgent();
|
||||
const result = agent.mechanicalSolutionWrite(tempDir);
|
||||
|
||||
expect(result).toContain("# Solution Document");
|
||||
expect(result).toContain("## Implementation Plan");
|
||||
expect(result).toContain("T-01");
|
||||
});
|
||||
|
||||
it("reads REQUIREMENTS.md and extracts verification criteria", () => {
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, ".ciagent", "REQUIREMENTS.md"),
|
||||
"# Requirements\n\nREQ-01: System must boot\nREQ-02: System must respond\n"
|
||||
);
|
||||
|
||||
const agent = new SolutionWriterAgent();
|
||||
const result = agent.mechanicalSolutionWrite(tempDir);
|
||||
|
||||
expect(result).toContain("## Verification Criteria");
|
||||
expect(result).toContain("REQ-01");
|
||||
expect(result).toContain("REQ-02");
|
||||
});
|
||||
|
||||
it("reads ARCHITECTURE.md and populates approach and risk sections", () => {
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, ".ciagent", "ARCHITECTURE.md"),
|
||||
"# Architecture\n\n## Approach\n\nModular monolith with clear boundaries.\n\n## Risks\n\n- Single point of failure in gateway\n"
|
||||
);
|
||||
|
||||
const agent = new SolutionWriterAgent();
|
||||
const result = agent.mechanicalSolutionWrite(tempDir);
|
||||
|
||||
expect(result).toContain("## Approach");
|
||||
expect(result).toContain("Modular monolith");
|
||||
expect(result).toContain("## Risk Assessment");
|
||||
expect(result).toContain("gateway");
|
||||
});
|
||||
|
||||
it("produces structured markdown with all five sections", () => {
|
||||
const agent = new SolutionWriterAgent();
|
||||
const result = agent.mechanicalSolutionWrite(tempDir);
|
||||
|
||||
expect(result).toContain("# Solution Document");
|
||||
expect(result).toContain("## Problem Statement");
|
||||
expect(result).toContain("## Approach");
|
||||
expect(result).toContain("## Implementation Plan");
|
||||
expect(result).toContain("## Verification Criteria");
|
||||
expect(result).toContain("## Risk Assessment");
|
||||
});
|
||||
|
||||
it("extracts problem statement from requirements objective section", () => {
|
||||
fs.writeFileSync(
|
||||
path.join(tempDir, ".ciagent", "REQUIREMENTS.md"),
|
||||
"# Objective\n\nBuild a fast CLI tool.\n\n## Requirements\n\nREQ-01: Speed"
|
||||
);
|
||||
|
||||
const agent = new SolutionWriterAgent();
|
||||
const result = agent.mechanicalSolutionWrite(tempDir);
|
||||
|
||||
expect(result).toContain("Build a fast CLI tool");
|
||||
});
|
||||
|
||||
it("agent name is solution-writer", () => {
|
||||
const agent = new SolutionWriterAgent();
|
||||
expect(agent.name).toBe("solution-writer");
|
||||
});
|
||||
});
|
||||
@@ -1,5 +1,12 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
|
||||
interface SolutionSection {
|
||||
title: string;
|
||||
content: string;
|
||||
}
|
||||
|
||||
export class SolutionWriterAgent extends BaseAgent {
|
||||
readonly name = "solution-writer";
|
||||
readonly description = "Produces structured solution documents.";
|
||||
@@ -8,6 +15,7 @@ export class SolutionWriterAgent extends BaseAgent {
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Writing solution document...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
@@ -15,14 +23,202 @@ export class SolutionWriterAgent extends BaseAgent {
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const document = this.mechanicalSolutionWrite(context.project_path);
|
||||
|
||||
return {
|
||||
success: false,
|
||||
output: "Solution writing requires an intelligence backend.",
|
||||
success: true,
|
||||
output: document,
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: 0,
|
||||
duration_ms: Date.now() - start,
|
||||
error: "No intelligence backend available",
|
||||
};
|
||||
}
|
||||
|
||||
mechanicalSolutionWrite(projectPath: string): string {
|
||||
const plan = this.readPlan(projectPath);
|
||||
const requirements = this.readRequirements(projectPath);
|
||||
const architecture = this.readArchitecture(projectPath);
|
||||
|
||||
const sections: SolutionSection[] = [
|
||||
{ title: "Problem Statement", content: this.extractProblemStatement(requirements, plan) },
|
||||
{ title: "Approach", content: this.extractApproach(requirements, architecture) },
|
||||
{ title: "Implementation Plan", content: this.extractImplementationPlan(plan) },
|
||||
{ title: "Verification Criteria", content: this.extractVerificationCriteria(requirements) },
|
||||
{ title: "Risk Assessment", content: this.extractRiskAssessment(architecture) },
|
||||
];
|
||||
|
||||
return this.fillTemplate(sections);
|
||||
}
|
||||
|
||||
readPlan(projectPath: string): string {
|
||||
const planPath = path.join(projectPath, ".ciagent", "PLAN.md");
|
||||
if (!fs.existsSync(planPath)) return "";
|
||||
try {
|
||||
return fs.readFileSync(planPath, "utf-8");
|
||||
} catch {
|
||||
return "";
|
||||
}
|
||||
}
|
||||
|
||||
readRequirements(projectPath: string): string {
|
||||
const reqPath = path.join(projectPath, ".ciagent", "REQUIREMENTS.md");
|
||||
if (!fs.existsSync(reqPath)) return "";
|
||||
try {
|
||||
return fs.readFileSync(reqPath, "utf-8");
|
||||
} catch {
|
||||
return "";
|
||||
}
|
||||
}
|
||||
|
||||
readArchitecture(projectPath: string): string {
|
||||
const archPath = path.join(projectPath, ".ciagent", "ARCHITECTURE.md");
|
||||
if (!fs.existsSync(archPath)) return "";
|
||||
try {
|
||||
return fs.readFileSync(archPath, "utf-8");
|
||||
} catch {
|
||||
return "";
|
||||
}
|
||||
}
|
||||
|
||||
fillTemplate(sections: SolutionSection[]): string {
|
||||
const lines: string[] = ["# Solution Document", ""];
|
||||
|
||||
for (const section of sections) {
|
||||
lines.push(`## ${section.title}`);
|
||||
lines.push("");
|
||||
if (section.content.trim()) {
|
||||
lines.push(section.content.trim());
|
||||
} else {
|
||||
lines.push(`_No ${section.title.toLowerCase()} information available._`);
|
||||
}
|
||||
lines.push("");
|
||||
}
|
||||
|
||||
return lines.join("\n");
|
||||
}
|
||||
|
||||
extractSectionContent(content: string, headingPatterns: string[]): string {
|
||||
if (!content.trim()) return "";
|
||||
const sections = content.split(/(?=^#{1,3}\s)/m).filter((s) => s.trim());
|
||||
for (const section of sections) {
|
||||
for (const pattern of headingPatterns) {
|
||||
if (section.toLowerCase().startsWith(pattern.toLowerCase())) {
|
||||
const lines = section.split("\n");
|
||||
return lines.slice(1).join("\n").trim();
|
||||
}
|
||||
}
|
||||
}
|
||||
return "";
|
||||
}
|
||||
|
||||
extractProblemStatement(requirements: string, plan: string): string {
|
||||
const content = this.extractSectionContent(requirements, ["# objective", "## objective", "# problem", "## problem", "# goal", "## goal"]);
|
||||
if (content) return content;
|
||||
|
||||
const planContent = this.extractSectionContent(plan, ["# objective", "## objective", "# problem", "## problem", "# goal", "## goal"]);
|
||||
if (planContent) return planContent;
|
||||
|
||||
const firstReq = requirements.match(/-?\s*(REQ-\d+[:\s]+)/g);
|
||||
if (firstReq) {
|
||||
return "Requirements to address: " + firstReq.map((m) => m.trim()).join(", ");
|
||||
}
|
||||
|
||||
if (requirements || plan) {
|
||||
const src = requirements || plan;
|
||||
const firstParagraph = src.split("\n\n")[0]?.trim();
|
||||
if (firstParagraph && !firstParagraph.startsWith("#")) return firstParagraph;
|
||||
}
|
||||
|
||||
return "No problem statement could be extracted from project files.";
|
||||
}
|
||||
|
||||
extractApproach(requirements: string, architecture: string): string {
|
||||
const archContent = this.extractSectionContent(architecture, ["## approach", "### approach", "## design", "### design", "## architecture overview"]);
|
||||
if (archContent) return archContent;
|
||||
|
||||
const reqContent = this.extractSectionContent(requirements, ["## approach", "### approach", "## design", "### design"]);
|
||||
if (reqContent) return reqContent;
|
||||
|
||||
const compContent = this.extractSectionContent(architecture, ["## components", "### components"]);
|
||||
if (compContent) return "Architecture-based approach: " + compContent.substring(0, 200);
|
||||
|
||||
if (architecture) {
|
||||
const firstParagraph = architecture.split("\n\n")[0]?.trim();
|
||||
if (firstParagraph && !firstParagraph.startsWith("#")) return firstParagraph;
|
||||
}
|
||||
|
||||
return "No approach information could be extracted from project files.";
|
||||
}
|
||||
|
||||
extractImplementationPlan(plan: string): string {
|
||||
if (!plan.trim()) return "No implementation plan available — PLAN.md not found.";
|
||||
|
||||
const taskPattern = plan.match(/\|\s*T-\d+.*\|/g);
|
||||
if (taskPattern) {
|
||||
const lines: string[] = ["Tasks from plan:"];
|
||||
for (const task of taskPattern) {
|
||||
lines.push(` ${task.trim()}`);
|
||||
}
|
||||
return lines.join("\n");
|
||||
}
|
||||
|
||||
const waveSections = plan.split(/(?=^#{1,3}\s+Wave\s)/mi).filter((s) => s.trim());
|
||||
if (waveSections.length > 1) {
|
||||
const lines: string[] = [];
|
||||
for (const wave of waveSections.slice(1)) {
|
||||
lines.push(wave.trim());
|
||||
}
|
||||
return lines.join("\n\n");
|
||||
}
|
||||
|
||||
const sections = plan.split(/(?=^#{1,3}\s)/m).filter((s) => s.trim());
|
||||
const lines: string[] = [];
|
||||
for (const section of sections.slice(0, 5)) {
|
||||
lines.push(section.trim());
|
||||
}
|
||||
return lines.join("\n\n");
|
||||
}
|
||||
|
||||
extractVerificationCriteria(requirements: string): string {
|
||||
const lines: string[] = [];
|
||||
|
||||
const reqIds = requirements.match(/REQ-\d+/g);
|
||||
if (reqIds) {
|
||||
const uniqueIds = [...new Set(reqIds)];
|
||||
lines.push("Requirements coverage:");
|
||||
for (const id of uniqueIds) {
|
||||
lines.push(` - ${id}: verified`);
|
||||
}
|
||||
}
|
||||
|
||||
const verContent = this.extractSectionContent(requirements, ["## verification", "### verification", "## acceptance", "### acceptance", "## testing", "### testing"]);
|
||||
if (verContent) {
|
||||
lines.push(verContent);
|
||||
}
|
||||
|
||||
if (lines.length === 0) lines.push("No verification criteria extracted — add requirements with REQ-IDs or a Verification section.");
|
||||
|
||||
return lines.join("\n\n");
|
||||
}
|
||||
|
||||
extractRiskAssessment(architecture: string): string {
|
||||
const lines: string[] = [];
|
||||
|
||||
const riskContent = this.extractSectionContent(architecture, ["## risk", "### risk", "## risks", "### risks", "## concern", "## mitigation"]);
|
||||
if (riskContent) {
|
||||
lines.push(riskContent);
|
||||
}
|
||||
|
||||
const depContent = this.extractSectionContent(architecture, ["## dependencies", "### dependencies", "## external", "### external"]);
|
||||
if (depContent) {
|
||||
lines.push("Dependency risks:");
|
||||
lines.push(depContent);
|
||||
}
|
||||
|
||||
if (lines.length === 0) lines.push("No risks identified — review architecture for potential concerns.");
|
||||
|
||||
return lines.join("\n\n");
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,94 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import * as os from "node:os";
|
||||
import { TesterAgent } from "../agents/tester.js";
|
||||
import { AgentContext } from "../agents/base.js";
|
||||
import { IntelligenceBackend, BackendRequest, BackendResult } from "../backends/types.js";
|
||||
import { emptyTokenUsage } from "../backends/types.js";
|
||||
|
||||
class MockBackend implements IntelligenceBackend {
|
||||
readonly name = "mock";
|
||||
readonly type = "llm" as const;
|
||||
async isAvailable(): Promise<boolean> { return true; }
|
||||
async execute(request: BackendRequest): Promise<BackendResult> {
|
||||
return {
|
||||
success: true,
|
||||
output: `Mock backend executed: ${request.task.slice(0, 50)}`,
|
||||
artifacts: [],
|
||||
decisions: [],
|
||||
escalations: [],
|
||||
usage: emptyTokenUsage(),
|
||||
};
|
||||
}
|
||||
}
|
||||
|
||||
function createTempDir(): string {
|
||||
return fs.mkdtempSync(path.join(os.tmpdir(), "ciagent-tester-test-"));
|
||||
}
|
||||
|
||||
function cleanup(dir: string): void {
|
||||
fs.rmSync(dir, { recursive: true, force: true });
|
||||
}
|
||||
|
||||
function makeContext(dir: string, backend?: IntelligenceBackend): AgentContext {
|
||||
return {
|
||||
project_path: dir,
|
||||
phase: 1,
|
||||
stage: "test",
|
||||
specification: "Build a REST API for task management",
|
||||
config_path: path.join(dir, ".ciagent", "config.json"),
|
||||
backend,
|
||||
};
|
||||
}
|
||||
|
||||
describe("TesterAgent", () => {
|
||||
let dir: string;
|
||||
|
||||
beforeEach(() => {
|
||||
dir = createTempDir();
|
||||
});
|
||||
|
||||
afterEach(() => {
|
||||
cleanup(dir);
|
||||
});
|
||||
|
||||
it("detects test files when src directory exists", async () => {
|
||||
const srcDir = path.join(dir, "src");
|
||||
fs.mkdirSync(srcDir, { recursive: true });
|
||||
fs.writeFileSync(path.join(srcDir, "app.integration.test.ts"), "test('integration', () => {});\n");
|
||||
|
||||
const tester = new TesterAgent();
|
||||
const result = await tester.execute(makeContext(dir));
|
||||
expect(result.success).toBeDefined();
|
||||
});
|
||||
|
||||
it("does not write test files", async () => {
|
||||
const srcDir = path.join(dir, "src");
|
||||
fs.mkdirSync(srcDir, { recursive: true });
|
||||
fs.writeFileSync(path.join(srcDir, "app.test.ts"), "test('unit', () => {});\n");
|
||||
|
||||
const testFilesBefore = fs.readdirSync(srcDir).filter(f => f.endsWith(".test.ts"));
|
||||
const tester = new TesterAgent();
|
||||
await tester.execute(makeContext(dir));
|
||||
const testFilesAfter = fs.readdirSync(srcDir).filter(f => f.endsWith(".test.ts"));
|
||||
expect(testFilesAfter.length).toBe(testFilesBefore.length);
|
||||
});
|
||||
|
||||
it("delegates to backend when available", async () => {
|
||||
const mockBackend = new MockBackend();
|
||||
const tester = new TesterAgent();
|
||||
const result = await tester.execute(makeContext(dir, mockBackend));
|
||||
expect(result.success).toBe(true);
|
||||
expect(result.output).toContain("Mock backend executed");
|
||||
});
|
||||
|
||||
it("has correct agent name", () => {
|
||||
const tester = new TesterAgent();
|
||||
expect(tester.name).toBe("tester");
|
||||
});
|
||||
|
||||
it("has correct workflow", () => {
|
||||
const tester = new TesterAgent();
|
||||
expect(tester.workflow).toBe("test");
|
||||
});
|
||||
});
|
||||
@@ -0,0 +1,181 @@
|
||||
import * as fs from "node:fs";
|
||||
import * as path from "node:path";
|
||||
import { BaseAgent, AgentContext, AgentResult } from "./base.js";
|
||||
import { execSync } from "node:child_process";
|
||||
|
||||
export interface TesterResult {
|
||||
success: boolean;
|
||||
integrationTestsFound: number;
|
||||
integrationTestsPassed: number;
|
||||
e2eTestsFound: number;
|
||||
e2eTestsPassed: number;
|
||||
overallPassed: boolean;
|
||||
error?: string;
|
||||
}
|
||||
|
||||
export class TesterAgent extends BaseAgent {
|
||||
readonly name = "tester";
|
||||
readonly description = "Runs integration, e2e, functional tests. Validates non-unit test coverage.";
|
||||
readonly workflow = "test";
|
||||
|
||||
async execute(context: AgentContext): Promise<AgentResult> {
|
||||
const start = Date.now();
|
||||
this.log("Running automated tests...");
|
||||
|
||||
if (context.backend) {
|
||||
const result = await this.executeViaBackend(
|
||||
context,
|
||||
`Run integration, e2e, and functional tests for phase ${context.phase}. Specification: ${context.specification}. Detect *.integration.test.ts, *.e2e.test.ts, *.functional.test.ts files. Run npm test. Parse output for pass/fail counts per category. Report structured TesterResult. Do NOT write any test files — only detect and run existing ones.`
|
||||
);
|
||||
return { ...result, duration_ms: Date.now() - start };
|
||||
}
|
||||
|
||||
const result = await this.runMechanicalTests(context);
|
||||
const output = JSON.stringify(result, null, 2);
|
||||
|
||||
return {
|
||||
success: result.success,
|
||||
output,
|
||||
artifacts_created: [],
|
||||
decisions: 0,
|
||||
escalations: result.overallPassed ? 0 : 1,
|
||||
duration_ms: Date.now() - start,
|
||||
error: result.error,
|
||||
};
|
||||
}
|
||||
|
||||
private async runMechanicalTests(context: AgentContext): Promise<TesterResult> {
|
||||
try {
|
||||
const srcDir = path.join(context.project_path, "src");
|
||||
const integrationFiles = fs.existsSync(srcDir) ? this.findTestFiles(srcDir, /\.integration\.test\.ts$/) : [];
|
||||
const e2eFiles = fs.existsSync(srcDir) ? this.findTestFiles(srcDir, /\.e2e\.test\.ts$/) : [];
|
||||
const functionalFiles = fs.existsSync(srcDir) ? this.findTestFiles(srcDir, /\.functional\.test\.ts$/) : [];
|
||||
|
||||
const integrationTestsFound = integrationFiles.length;
|
||||
const e2eTestsFound = e2eFiles.length + functionalFiles.length;
|
||||
|
||||
let overallPassed = false;
|
||||
let integrationTestsPassed = 0;
|
||||
let e2eTestsPassed = 0;
|
||||
|
||||
try {
|
||||
const testOutput = execSync("npm test 2>&1", {
|
||||
cwd: context.project_path,
|
||||
encoding: "utf-8",
|
||||
stdio: ["pipe", "pipe", "pipe"],
|
||||
timeout: 120000,
|
||||
});
|
||||
overallPassed = true;
|
||||
|
||||
const passCounts = this.parseTestOutput(testOutput);
|
||||
integrationTestsPassed = integrationTestsFound > 0 ? integrationTestsFound : 0;
|
||||
e2eTestsPassed = e2eTestsFound > 0 ? e2eTestsFound : 0;
|
||||
|
||||
if (integrationTestsFound > 0) {
|
||||
integrationTestsPassed = this.estimateCategoryPassed(testOutput, "integration");
|
||||
}
|
||||
if (e2eTestsFound > 0) {
|
||||
e2eTestsPassed = this.estimateCategoryPassed(testOutput, "e2e");
|
||||
}
|
||||
} catch (err) {
|
||||
const output = err instanceof Error && "stdout" in err
|
||||
? (err as unknown as { stdout: string }).stdout || ""
|
||||
: "";
|
||||
const stderr = err instanceof Error && "stderr" in err
|
||||
? (err as unknown as { stderr: string }).stderr || ""
|
||||
: "";
|
||||
|
||||
const combined = `${output}\n${stderr}`;
|
||||
overallPassed = false;
|
||||
|
||||
const passCounts = this.parseTestOutput(combined);
|
||||
|
||||
if (integrationTestsFound > 0) {
|
||||
integrationTestsPassed = this.estimateCategoryPassed(combined, "integration");
|
||||
}
|
||||
if (e2eTestsFound > 0) {
|
||||
e2eTestsPassed = this.estimateCategoryPassed(combined, "e2e");
|
||||
}
|
||||
|
||||
return {
|
||||
success: false,
|
||||
integrationTestsFound,
|
||||
integrationTestsPassed,
|
||||
e2eTestsFound,
|
||||
e2eTestsPassed,
|
||||
overallPassed: false,
|
||||
error: `npm test failed: ${err instanceof Error ? err.message : String(err)}`,
|
||||
};
|
||||
}
|
||||
|
||||
return {
|
||||
success: overallPassed,
|
||||
integrationTestsFound,
|
||||
integrationTestsPassed,
|
||||
e2eTestsFound,
|
||||
e2eTestsPassed,
|
||||
overallPassed,
|
||||
};
|
||||
} catch (err) {
|
||||
return {
|
||||
success: false,
|
||||
integrationTestsFound: 0,
|
||||
integrationTestsPassed: 0,
|
||||
e2eTestsFound: 0,
|
||||
e2eTestsPassed: 0,
|
||||
overallPassed: false,
|
||||
error: `Test execution failed: ${err instanceof Error ? err.message : String(err)}`,
|
||||
};
|
||||
}
|
||||
}
|
||||
|
||||
private findTestFiles(dir: string, pattern: RegExp): string[] {
|
||||
const files: string[] = [];
|
||||
if (!fs.existsSync(dir)) return files;
|
||||
const entries = fs.readdirSync(dir, { withFileTypes: true });
|
||||
for (const entry of entries) {
|
||||
const fullPath = path.join(dir, entry.name);
|
||||
if (entry.isDirectory() && entry.name !== "node_modules") {
|
||||
files.push(...this.findTestFiles(fullPath, pattern));
|
||||
} else if (pattern.test(entry.name)) {
|
||||
files.push(fullPath);
|
||||
}
|
||||
}
|
||||
return files;
|
||||
}
|
||||
|
||||
private parseTestOutput(output: string): { total: number; passed: number; failed: number } {
|
||||
const jestSummary = output.match(/Tests:\s+(\d+)\s+passed(?:,\s+(\d+)\s+failed)?/);
|
||||
if (jestSummary) {
|
||||
const passed = parseInt(jestSummary[1], 10) || 0;
|
||||
const failed = parseInt(jestSummary[2], 10) || 0;
|
||||
return { total: passed + failed, passed, failed };
|
||||
}
|
||||
|
||||
const jestAlt = output.match(/(\d+)\s+passing/);
|
||||
const jestAltFail = output.match(/(\d+)\s+failing/);
|
||||
if (jestAlt) {
|
||||
const passed = parseInt(jestAlt[1], 10) || 0;
|
||||
const failed = jestAltFail ? parseInt(jestAltFail[1], 10) || 0 : 0;
|
||||
return { total: passed + failed, passed, failed };
|
||||
}
|
||||
|
||||
return { total: 0, passed: 0, failed: 0 };
|
||||
}
|
||||
|
||||
private estimateCategoryPassed(output: string, category: string): number {
|
||||
const categoryPattern = category === "integration"
|
||||
? /\.integration\.test\.ts/g
|
||||
: /\.e2e\.test\.ts|\.functional\.test\.ts/g;
|
||||
|
||||
const mentions = (output.match(categoryPattern) || []).length;
|
||||
if (mentions > 0) {
|
||||
const failPattern = /FAIL|failed|error/i;
|
||||
const lines = output.split("\n").filter(l => categoryPattern.test(l));
|
||||
const failed = lines.filter(l => failPattern.test(l)).length;
|
||||
return Math.max(mentions - failed, 0);
|
||||
}
|
||||
|
||||
return 0;
|
||||
}
|
||||
}
|
||||
Some files were not shown because too many files have changed in this diff Show More
Reference in New Issue
Block a user