├── tests
    ├── __init__.py
    ├── test_auth.py
    ├── test_config.py
    └── conftest.py
├── .genie
    ├── state
    │   ├── provider-status.json
    │   └── version.json
    ├── AGENTS.md
    ├── spells
    │   ├── README.md
    │   ├── blocker.md
    │   ├── run-in-parallel.md
    │   ├── gather-context.md
    │   ├── global-noop-roundtrip.md
    │   ├── global-health-check.md
    │   ├── context-critic.md
    │   ├── break-things-move-fast.md
    │   ├── context-candidates.md
    │   ├── experiment.md
    │   ├── multi-step-execution.md
    │   ├── install.md
    │   ├── ace-protocol.md
    │   ├── mcp-first.md
    │   ├── wish-lifecycle.md
    │   ├── investigate-before-commit.md
    │   ├── track-long-running-tasks.md
    │   └── wish-initiation.md
    ├── code
    │   ├── spells
    │   │   ├── tool-requirements.md
    │   │   ├── branch-tracker-guidance.md
    │   │   ├── file-naming-rules.md
    │   │   ├── evidence-storage.md
    │   │   ├── agent-configuration.md
    │   │   ├── publishing-protocol.md
    │   │   ├── automated-rc-publishing.md
    │   │   └── triad-maintenance-protocol.md
    │   └── agents
    │   │   ├── docgen.md
    │   │   ├── update
    │   │       └── upstream-update.md
    │   │   ├── fix.md
    │   │   ├── explore.md
    │   │   ├── commit.md
    │   │   ├── polish.md
    │   │   ├── audit.md
    │   │   └── git
    │   │       └── workflows
    │   │           └── pr.md
    ├── product
    │   ├── README.md
    │   ├── templates
    │   │   ├── qa-done-report-template.md
    │   │   ├── review-report-template.md
    │   │   ├── wish-template.md
    │   │   └── context-template.md
    │   ├── tech-stack.md
    │   ├── roadmap.md
    │   ├── environment.md
    │   └── mission.md
    ├── neurons
    │   ├── genie.md
    │   ├── wish.md
    │   ├── review.md
    │   └── forge.md
    ├── agents
    │   ├── semantic-analyzer
    │   │   ├── find-duplicates.md
    │   │   └── find-orphans.md
    │   ├── semantic-analyzer.md
    │   ├── update.md
    │   └── README.md
    └── scripts
    │   └── helpers
    │       ├── detect-unlabeled-blocks.js
    │       ├── find-empty-sections.js
    │       ├── validate-links.js
    │       └── bullet-counter.js
├── .github
    ├── images
    │   └── murmur-200.png
    ├── release.yml
    └── workflows
    │   └── ci.yml
├── src
    └── murmurai_server
    │   ├── __init__.py
    │   ├── __main__.py
    │   ├── auth.py
    │   ├── main.py
    │   ├── config.py
    │   └── logging.py
├── .dockerignore
├── .vscode
    └── launch.json
├── docker-compose.yml
├── .pre-commit-config.yaml
├── LICENSE
├── Dockerfile
├── CLAUDE.md
├── .env.example
├── pyproject.toml
├── .gitignore
└── scripts
    └── bump_version.py


/tests/__init__.py:
--------------------------------------------------------------------------------
1 | """MurmurAI API test suite."""
2 | 


--------------------------------------------------------------------------------
/.genie/state/provider-status.json:
--------------------------------------------------------------------------------
1 | {
2 |   "entries": []
3 | }
4 | 


--------------------------------------------------------------------------------
/.github/images/murmur-200.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/namastexlabs/murmurai/HEAD/.github/images/murmur-200.png


--------------------------------------------------------------------------------
/src/murmurai_server/__init__.py:
--------------------------------------------------------------------------------
1 | """MurmurAI - GPU-powered transcription service with speaker diarization."""
2 | 
3 | __version__ = "1.0.4"
4 | 


--------------------------------------------------------------------------------
/src/murmurai_server/__main__.py:
--------------------------------------------------------------------------------
1 | """Entry point for python -m murmurai."""
2 | 
3 | from murmurai_server.main import run
4 | 
5 | if __name__ == "__main__":
6 |     run()
7 | 


--------------------------------------------------------------------------------
/.dockerignore:
--------------------------------------------------------------------------------
 1 | # Git
 2 | .git
 3 | .gitignore
 4 | 
 5 | # Python
 6 | .venv
 7 | __pycache__
 8 | *.pyc
 9 | *.pyo
10 | *.egg-info
11 | .eggs
12 | dist/
13 | build/
14 | 
15 | # Tests
16 | tests/
17 | 
18 | # Data (mounted as volume instead)
19 | data/
20 | 
21 | # IDE
22 | .vscode
23 | .idea
24 | 
25 | # Development files
26 | *.md
27 | !README.md
28 | .env
29 | .env.example
30 | 


--------------------------------------------------------------------------------
/.genie/AGENTS.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Base
 3 | label: 🧞 Base
 4 | description: Global agents (orchestration, QA, analysis, maintenance)
 5 | github_url: https://github.com/namastexlabs/automagik-genie/tree/main/.genie
 6 | ---
 7 | 
 8 | # Base Genie Agents
 9 | 
10 | **Global agents available across all collectives.**
11 | 
12 | For complete orchestration framework and instructions, see:
13 | @AGENTS.md
14 | 


--------------------------------------------------------------------------------
/.genie/spells/README.md:
--------------------------------------------------------------------------------
1 | 
2 | # Forge Workflows (Global)
3 | 
4 | Global Forge workflows applicable across domains. Core `forge` agent delegates here when a domain-agnostic flow is sufficient. Domain-specific flows live under each collective (e.g., `code/workflows/forge.md`).
5 | 
6 | ## Structure
7 | - One file per workflow under `workflows/forge/`
8 | - Keep flows atomic, with clear inputs, steps, and evidence
9 | 


--------------------------------------------------------------------------------
/.genie/spells/blocker.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Blocker Protocol
 3 | description: Log blockers timestamped in wishes, wait for guidance before resuming
 4 | ---
 5 | 
 6 | # Blocker Protocol
 7 | 
 8 | **When encountering blockers:**
 9 | 
10 | 1. Log the blocker directly in the wish (timestamped entry with findings and status).
11 | 2. Update the wish status log and notify stakeholders.
12 | 3. Resume only after guidance is updated.
13 | 


--------------------------------------------------------------------------------
/.genie/spells/run-in-parallel.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Parallel Execution Framework
 3 | description: Run independent tasks in parallel, maintain visibility into all threads
 4 | ---
 5 | 
 6 | # Parallel Execution Framework
 7 | 
 8 | **Purpose:** Manage parallel work without losing clarity.
 9 | 
10 | **Success criteria:**
11 | ✅ Run tasks in parallel only when independent.
12 | ✅ Summaries capture status of each thread; human has visibility into all threads.
13 | 


--------------------------------------------------------------------------------
/.vscode/launch.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "version": "0.2.0",
 3 |   "configurations": [
 4 |     {
 5 |       "name": "Debug pytest",
 6 |       "type": "python",
 7 |       "request": "launch",
 8 |       "module": "pytest",
 9 |       "cwd": "${workspaceFolder}",
10 |       "args": [
11 |         "-v",
12 |         "-s"
13 |       ],
14 |       "env": {
15 |         "PYTHONPATH": "${workspaceFolder}"
16 |       },
17 |       "justMyCode": false
18 |     }
19 |   ]
20 | }
21 | 


--------------------------------------------------------------------------------
/.genie/state/version.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "version": "2.5.28-rc.2",
 3 |   "installedAt": "2025-12-11T15:08:53.090Z",
 4 |   "updatedAt": "2025-12-11T15:08:53.090Z",
 5 |   "commit": "f9bd294",
 6 |   "packageName": "automagik-genie",
 7 |   "customizedFiles": [],
 8 |   "deletedFiles": [],
 9 |   "lastUpgrade": null,
10 |   "previousVersion": null,
11 |   "upgradeHistory": [],
12 |   "migrationInfo": {
13 |     "backupId": "n/a",
14 |     "claudeBackedUp": false
15 |   }
16 | }
17 | 


--------------------------------------------------------------------------------
/.genie/spells/gather-context.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Genie Missing Context Protocol
 3 | description: Provide Files Needed block when critical context is missing
 4 | ---
 5 | 
 6 | # Genie Missing Context Protocol
 7 | 
 8 | When critical technical context is missing (files, specs), provide a Files Needed block instead of speculative output.
 9 | 
10 | ## Files Needed (use when necessary)
11 | 
12 | ```
13 | status: files_required_to_continue
14 | mandatory_instructions: <what is needed and why>
15 | files_needed: [ path/or/folder, ... ]
16 | ```
17 | 
18 | Use only for technical implementation gaps, not for business/strategy questions.
19 | 


--------------------------------------------------------------------------------
/.genie/code/spells/tool-requirements.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Tool Requirements
 3 | description: Validate with pnpm run check and cargo test --workspace
 4 | genie:
 5 |   executor: [CLAUDE_CODE, CODEX, OPENCODE]
 6 | forge:
 7 |   CLAUDE_CODE:
 8 |     model: sonnet
 9 |   CODEX: {}
10 |   OPENCODE: {}
11 | ---
12 | 
13 | # Tool Requirements
14 | 
15 | **Primary stack:** Rust + Node/TS; metrics/test hooks captured in wishes/forge plans.
16 | 
17 | **Success criteria:**
18 | ✅ Use `pnpm run check` and `cargo test --workspace` for validation.
19 | ✅ Generate types/metrics via documented scripts where applicable.
20 | ✅ Python/uv only if introduced and documented.
21 | 


--------------------------------------------------------------------------------
/.genie/spells/global-noop-roundtrip.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: forge-global-noop-roundtrip
 3 | description: No-op Wish → Review roundtrip without domain specifics
 4 | 
 5 | ---
 6 | 
 7 | # Forge Global No-Op Roundtrip
 8 | 
 9 | ## Steps
10 | 1) Create placeholder wish
11 | ```
12 | mcp__genie__run agent="wish" prompt="Create placeholder wish with no code changes"
13 | ```
14 | 2) Review placeholder wish
15 | ```
16 | mcp__genie__run agent="review" prompt="Review placeholder wish"
17 | ```
18 | 
19 | ## Success Criteria
20 | - Wish document written under `.genie/wishes/<slug>/`
21 | - Review runs without code-specific dependencies
22 | 
23 | ## Evidence
24 | - Save outputs to `.genie/qa/evidence/forge-noop-<timestamp>.txt`
25 | 


--------------------------------------------------------------------------------
/docker-compose.yml:
--------------------------------------------------------------------------------
 1 | services:
 2 |   murmurai:
 3 |     build: .
 4 |     ports:
 5 |       - "8880:8880"
 6 |     environment:
 7 |       - MURMURAI_API_KEY=${MURMURAI_API_KEY:-namastex888}
 8 |       - MURMURAI_HF_TOKEN=${MURMURAI_HF_TOKEN:-}
 9 |       - MURMURAI_LOG_FORMAT=${MURMURAI_LOG_FORMAT:-text}
10 |     volumes:
11 |       # Persist transcripts database
12 |       - ./data:/app/data
13 |       # Cache HuggingFace models (saves download time on restart)
14 |       - ~/.cache/huggingface:/root/.cache/huggingface
15 |     deploy:
16 |       resources:
17 |         reservations:
18 |           devices:
19 |             - driver: nvidia
20 |               count: 1
21 |               capabilities: [gpu]
22 |     restart: unless-stopped
23 | 


--------------------------------------------------------------------------------
/.github/release.yml:
--------------------------------------------------------------------------------
 1 | changelog:
 2 |   exclude:
 3 |     labels:
 4 |       - ignore-for-release
 5 |     authors:
 6 |       - github-actions[bot]
 7 |   categories:
 8 |     - title: Breaking Changes
 9 |       labels:
10 |         - breaking
11 |         - breaking-change
12 |     - title: Features
13 |       labels:
14 |         - feature
15 |         - enhancement
16 |     - title: Bug Fixes
17 |       labels:
18 |         - bug
19 |         - fix
20 |         - bugfix
21 |     - title: Performance
22 |       labels:
23 |         - performance
24 |         - perf
25 |     - title: Documentation
26 |       labels:
27 |         - documentation
28 |         - docs
29 |     - title: Dependencies
30 |       labels:
31 |         - dependencies
32 |         - deps
33 |     - title: Other Changes
34 |       labels:
35 |         - "*"
36 | 


--------------------------------------------------------------------------------
/.genie/code/spells/branch-tracker-guidance.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Branch & Tracker Guidance
 3 | description: Use dedicated branches for medium/large changes, track IDs in wishes
 4 | genie:
 5 |   executor: [CLAUDE_CODE, CODEX, OPENCODE]
 6 | forge:
 7 |   CLAUDE_CODE:
 8 |     model: sonnet
 9 |   CODEX: {}
10 |   OPENCODE: {}
11 | ---
12 | 
13 | # Branch & Tracker Guidance
14 | 
15 | **Branch strategy:**
16 | - **Dedicated branch** (`feat/<wish-slug>`) for medium/large changes.
17 | - **Existing branch** only with documented rationale (wish status log).
18 | - **Micro-task** for tiny updates; track in wish status and commit advisory.
19 | 
20 | **Tracker management:**
21 | - Tracker IDs (from forge execution output) should be logged in the wish markdown once assigned. Capture them immediately after forge reports IDs.
22 | 
23 | A common snippet:
24 | 
25 | ```
26 | ### Tracking
27 | - Forge task: FORGE-123
28 | ```
29 | 


--------------------------------------------------------------------------------
/.pre-commit-config.yaml:
--------------------------------------------------------------------------------
 1 | repos:
 2 |   - repo: https://github.com/pre-commit/pre-commit-hooks
 3 |     rev: v4.5.0
 4 |     hooks:
 5 |       - id: trailing-whitespace
 6 |       - id: end-of-file-fixer
 7 |       - id: check-yaml
 8 |       - id: check-added-large-files
 9 |         args: ['--maxkb=1000']
10 |       - id: check-merge-conflict
11 | 
12 |   - repo: https://github.com/astral-sh/ruff-pre-commit
13 |     rev: v0.8.2
14 |     hooks:
15 |       - id: ruff
16 |         args: [--fix]
17 |       - id: ruff-format
18 | 
19 |   - repo: local
20 |     hooks:
21 |       - id: mypy
22 |         name: mypy
23 |         entry: uv run --frozen mypy src/
24 |         language: system
25 |         types: [python]
26 |         pass_filenames: false
27 | 
28 |       - id: pytest
29 |         name: pytest
30 |         entry: uv run --frozen pytest tests/ -x -q
31 |         language: system
32 |         types: [python]
33 |         pass_filenames: false
34 |         stages: [pre-push]
35 | 


--------------------------------------------------------------------------------
/src/murmurai_server/auth.py:
--------------------------------------------------------------------------------
 1 | """API key authentication."""
 2 | 
 3 | import secrets
 4 | 
 5 | from fastapi import HTTPException, Security
 6 | from fastapi.security import APIKeyHeader
 7 | 
 8 | from murmurai_server.config import get_settings
 9 | 
10 | api_key_header = APIKeyHeader(name="Authorization", auto_error=True)
11 | 
12 | 
13 | async def verify_api_key(api_key: str = Security(api_key_header)) -> str:
14 |     """Verify API key from Authorization header.
15 | 
16 |     Supports both formats:
17 |     - Raw API key
18 |     - Bearer token: "Bearer <api_key>"
19 | 
20 |     Uses timing-safe comparison to prevent timing attacks.
21 |     """
22 |     # Strip "Bearer " prefix if present
23 |     if api_key.startswith("Bearer "):
24 |         api_key = api_key[7:]
25 | 
26 |     settings = get_settings()
27 |     if not secrets.compare_digest(api_key, settings.api_key):
28 |         raise HTTPException(status_code=401, detail="Invalid API key")
29 |     return api_key
30 | 


--------------------------------------------------------------------------------
/.genie/spells/global-health-check.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: forge-global-health-check
 3 | description: Sanity check Forge orchestration and MCP access (domain-agnostic)
 4 | 
 5 | ---
 6 | 
 7 | # Forge Global Health Check
 8 | 
 9 | ## Goals
10 | - Verify Genie MCP tools are available
11 | - Verify core agents (forge, wish, review) are resolvable
12 | - Optional: verify a no-op wish→review roundtrip without domain specifics
13 | 
14 | ## Steps
15 | 1) List agents
16 | ```
17 | mcp__genie__list_agents
18 | ```
19 | Expect `forge`, `wish`, `review` to be present.
20 | 
21 | 2) Start noop wish (optional)
22 | ```
23 | mcp__genie__run agent="wish" prompt="Create a placeholder wish (no code), context: @.genie/product/mission.md"
24 | ```
25 | Record wish path if created.
26 | 
27 | 3) Dry review (optional)
28 | ```
29 | mcp__genie__run agent="review" prompt="Review placeholder wish (no code)"
30 | ```
31 | 
32 | ## Evidence
33 | - Save outputs to `.genie/qa/evidence/forge-health-<timestamp>.txt`
34 | 


--------------------------------------------------------------------------------
/.genie/product/README.md:
--------------------------------------------------------------------------------
 1 | # Product Docs Index
 2 | 
 3 | 
 4 | Use these as the single source of truth for product context. Reference with `@.genie/product/...` so agents auto-load content.
 5 | 
 6 | - `@.genie/product/mission.md` – Pitch, users, problem, key features
 7 | - `@.genie/product/tech-stack.md` – Technologies, architecture, dependencies
 8 | - `@.genie/product/environment.md` – Required/optional env vars and setup
 9 | - `@.genie/product/roadmap.md` – Phases, initiatives, and milestones
10 | - `@.genie/product/cli-automation.md` – Complete CLI automation guide (cron, CI/CD, scripts)
11 | 
12 | Framework behavior
13 | - The framework consumes these files via `@` references and injects their content into agent prompts.
14 | - Keep sections stable so downstream tools can parse consistently (e.g., headings like "Pitch", "Users", "The Problem").
15 | - Prefer updating these docs over scattering product data elsewhere.
16 | 
17 | Validation
18 | - The install and wish workflows verify these paths exist and surface missing sections as blockers.
19 | - If you rename/move files, update all `@.genie/product/...` references to avoid broken context.
20 | 


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
 1 | MIT License
 2 | 
 3 | Copyright (c) 2025 Namastex Labs
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | of this software and associated documentation files (the "Software"), to deal
 7 | in the Software without restriction, including without limitation the rights
 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 | 
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 | 
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/Dockerfile:
--------------------------------------------------------------------------------
 1 | # MurmurAI - GPU-powered transcription
 2 | # Using cudnn variant for speaker diarization support (cuDNN 9 required by ctranslate2 >= 4.5.0)
 3 | # CUDA 12.8 provides ~7.6% faster performance vs 12.6 (benchmarked 2024-12)
 4 | FROM nvidia/cuda:12.8.0-cudnn-runtime-ubuntu22.04
 5 | 
 6 | ENV DEBIAN_FRONTEND=noninteractive
 7 | WORKDIR /app
 8 | 
 9 | # Install uv
10 | COPY --from=ghcr.io/astral-sh/uv:latest /uv /usr/local/bin/uv
11 | 
12 | # Install Python 3.12 + venv
13 | RUN uv python install 3.12 && uv venv /app/.venv --python 3.12
14 | 
15 | ENV VIRTUAL_ENV=/app/.venv
16 | ENV PATH="/app/.venv/bin:$PATH"
17 | 
18 | # Copy manifests first to leverage layer caching
19 | COPY pyproject.toml uv.lock ./
20 | 
21 | # Install dependencies from lock file (cached unless deps change)
22 | RUN uv sync --frozen --no-dev --no-install-project
23 | 
24 | # Copy source code (changes here don't invalidate dep cache)
25 | COPY src/ ./src/
26 | 
27 | # Install the project itself (fast, no deps to resolve)
28 | RUN uv pip install --no-deps .
29 | 
30 | # Runtime config
31 | RUN mkdir -p /app/data
32 | EXPOSE 8880
33 | ENV MURMURAI_HOST=0.0.0.0
34 | ENV MURMURAI_PORT=8880
35 | ENV MURMURAI_DATA_DIR=/app/data
36 | 
37 | CMD ["murmurai"]
38 | 


--------------------------------------------------------------------------------
/.genie/code/spells/file-naming-rules.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: File and Naming Rules
 3 | description: Centralize planning and evidence under .genie/, avoid doc sprawl
 4 | genie:
 5 |   executor: [CLAUDE_CODE, CODEX, OPENCODE]
 6 | forge:
 7 |   CLAUDE_CODE:
 8 |     model: sonnet
 9 |   CODEX: {}
10 |   OPENCODE: {}
11 | ---
12 | 
13 | # File and Naming Rules
14 | 
15 | **Purpose:** Maintain tidy workspace; centralize planning and evidence under `.genie/`.
16 | 
17 | ## Success Criteria
18 | 
19 | ✅ No doc sprawl; update existing files instead of duplicating.
20 | ✅ Purpose-driven names; avoid hyperbole.
21 | ✅ Wishes/evidence paths normalized.
22 | 
23 | ## Forbidden Actions
24 | 
25 | ❌ Create documentation outside `.genie/` without instruction.
26 | ❌ Use forbidden naming patterns (fixed, improved, updated, better, new, v2, _fix, _v, enhanced, comprehensive).
27 | 
28 | ## Path Conventions
29 | 
30 | - Wishes: `.genie/wishes/<slug>/<slug>-wish.md`.
31 | - Evidence: declared by each wish (pick a clear folder or append directly in-document).
32 | - Forge plans: recorded in CLI output—mirror essentials back into the wish.
33 | - Blockers: logged inside the wish under a **Blockers** or status section.
34 | - Reports: `.genie/wishes/<slug>/reports/` (wish-specific Done Reports) or `.genie/reports/` (framework-level reports).
35 | - State: `.genie/state/` is ONLY for session tracking data (agents/sessions.json, logs); NEVER for reports.
36 | 


--------------------------------------------------------------------------------
/.genie/code/agents/docgen.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: docgen
 3 | description: Core documentation generation template
 4 | genie:
 5 |   executor:
 6 |     - CLAUDE_CODE
 7 |     - CODEX
 8 |     - OPENCODE
 9 |   background: true
10 | forge:
11 |   CLAUDE_CODE:
12 |     model: sonnet
13 |     dangerously_skip_permissions: true
14 |   CODEX:
15 |     model: gpt-5-codex
16 |     sandbox: danger-full-access
17 |   OPENCODE:
18 |     model: opencode/glm-4.6
19 | ---
20 | 
21 | # Genie DocGen Mode
22 | 
23 | ## Identity & Mission
24 | Produce concise, audience-targeted documentation outlines and draft bullets. Recommend next steps to complete docs.
25 | 
26 | ## Success Criteria
27 | - ✅ Outline aligned to the specified audience
28 | - ✅ Draft bullets for key sections
29 | - ✅ Actionable next steps to finish documentation
30 | 
31 | ## Prompt Template
32 | ```
33 | Audience: <dev|ops|pm>
34 | Outline: [ section1, section2 ]
35 | DraftBullets: { section1: [b1], section2: [b1] }
36 | Verdict: <ready|needs-revisions> (confidence: <low|med|high>)
37 | ```
38 | 
39 | ---
40 | 
41 | 
42 | ## Project Customization
43 | Define repository-specific defaults in  so this agent applies the right commands, context, and evidence expectations for your codebase.
44 | 
45 | Use the stub to note:
46 | - Core commands or tools this agent must run to succeed.
47 | - Primary docs, services, or datasets to inspect before acting.
48 | - Evidence capture or reporting rules unique to the project.
49 | 


--------------------------------------------------------------------------------
/.genie/code/spells/evidence-storage.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Evidence & Storage Conventions
 3 | description: Declare artifact locations and maintain evidence checklists
 4 | genie:
 5 |   executor: [CLAUDE_CODE, CODEX, OPENCODE]
 6 | forge:
 7 |   CLAUDE_CODE:
 8 |     model: sonnet
 9 |   CODEX: {}
10 |   OPENCODE: {}
11 | ---
12 | 
13 | # Evidence & Storage Conventions
14 | 
15 | ## Evidence Requirements
16 | 
17 | - Wishes must declare where artefacts live; there is no default `qa/` directory. Capture metrics inline in the wish (e.g., tables under a **Metrics** section) or in clearly named companion files.
18 | - Every wish must complete the **Evidence Checklist** block before implementation begins, spelling out validation commands, artefact locations, and approval checkpoints.
19 | - External tracker IDs live in the wish markdown (for example a **Tracking** section with `Forge task: FORGE-123`).
20 | - Background agent outputs are summarised in the wish context ledger; raw logs can be viewed with `mcp__genie__view` with sessionId parameter.
21 | 
22 | ## Testing & Evaluation
23 | 
24 | - Evaluation tooling is optional. If a project adds its own evaluator agent, the review or plan workflow can reference it; otherwise, evaluation steps default to manual validation.
25 | - Typical metrics: `{{METRICS}}` such as latency or quality. Domain-specific metrics should be added per project in the wish/forge plan.
26 | - Validation hooks should be captured in wishes/forge plans (e.g., `pnpm test`, `cargo test`, metrics scripts).
27 | 


--------------------------------------------------------------------------------
/CLAUDE.md:
--------------------------------------------------------------------------------
 1 | @AGENTS.md
 2 | 
 3 | # MurmurAI Project Context
 4 | 
 5 | ## Release Automation
 6 | 
 7 | **NEVER manually edit version numbers.** This project has automated release workflows.
 8 | 
 9 | ### How to Release
10 | 
11 | **Release Candidate (RC):**
12 | ```bash
13 | # Option 1: PR with label
14 | # Create PR → Add `rc` label → Merge to dev or main
15 | 
16 | # Option 2: Manual dispatch
17 | gh workflow run release.yml -f action=rc
18 | ```
19 | 
20 | **Stable Release:**
21 | ```bash
22 | # Option 1: PR with label (main branch only)
23 | # Create PR to main → Add `stable` label → Merge
24 | 
25 | # Option 2: Manual dispatch (main branch only)
26 | gh workflow run release.yml -f action=stable --ref main
27 | ```
28 | 
29 | ### What the Workflow Does
30 | 
31 | 1. **Gate Check** - Validates release conditions (labels, branch)
32 | 2. **Bump Version** - Runs `scripts/bump_version.py --action <rc|stable>`
33 |    - `rc`: 1.0.1 → 1.0.2-rc.1, or 1.0.2-rc.1 → 1.0.2-rc.2
34 |    - `stable`: 1.0.2-rc.5 → 1.0.2
35 | 3. **Commit & Tag** - Creates `chore: release vX.Y.Z` commit and git tag
36 | 4. **Build** - Uses `uv build` to create wheel/sdist
37 | 5. **Publish** - Pushes to PyPI via trusted publishing
38 | 6. **GitHub Release** - Creates release with auto-generated notes
39 | 
40 | ### CI Pipeline
41 | 
42 | Every push runs:
43 | - **Lint**: `ruff check` + `ruff format --check`
44 | - **Type Check**: `mypy src/`
45 | - **Test**: `pytest tests/` with coverage
46 | 
47 | ### Version Files
48 | 
49 | Version is stored in two places (both updated by bump script):
50 | - `pyproject.toml` - line 8: `version = "X.Y.Z"`
51 | - `src/murmurai_server/__init__.py` - line 3: `__version__ = "X.Y.Z"`
52 | 
53 | ### Branch Strategy
54 | 
55 | - `dev` - Development branch (RC releases)
56 | - `main` - Production branch (stable releases only)
57 | - Feature branches → PR to `dev`
58 | - `dev` → PR to `main` for stable release
59 | 


--------------------------------------------------------------------------------
/.genie/spells/context-critic.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Context Critic (Lightweight Evaluator)
 3 | description: Score candidate contexts on answerability, coverage, and cost quickly
 4 | ---
 5 | 
 6 | # Context Critic – Quick Scoring Heuristics
 7 | 
 8 | Purpose: Provide a cheap, fast evaluator to compare 2–3 context candidates before selection.
 9 | 
10 | Scoring Dimensions (0.0–1.0 each):
11 | - quality: Is the context sufficient to complete the immediate task? (answerability probe, clarity)
12 | - coverage: Does it include required sections/files/constraints? (checklist tally)
13 | - redundancy: Penalize duplication and irrelevant material
14 | - cost: Normalized inverse token estimate (lower tokens → higher score)
15 | - latency: Optional, if measurable during probes
16 | 
17 | Procedure:
18 | 1) Answerability Probe (quality)
19 | - Attempt to answer the core question or draft the key section from each candidate; judge confidence.
20 | 
21 | 2) Coverage Checklist (coverage)
22 | - Compare against known required items (wish template sections, mandatory refs, constraints).
23 | 
24 | 3) Redundancy Pass (redundancy)
25 | - Note duplicated sections, stale copies, or unnecessary full texts; penalize.
26 | 
27 | 4) Cost Estimate (cost)
28 | - Rough token count bands: low(<2k), med(2–6k), high(>6k); invert to 0–1.
29 | 
30 | Output structure per candidate:
31 | ```
32 | <critic_scores>
33 | - id: C1
34 |   quality: 0.85
35 |   coverage: 0.90
36 |   redundancy: 0.20
37 |   cost: 0.70
38 |   latency: low|med|high
39 |   notes: one line
40 | - id: C2 ...
41 | </critic_scores>
42 | ```
43 | 
44 | Selection Guidance:
45 | - Prefer higher quality and coverage first.
46 | - Break ties by (1) lower redundancy, (2) lower cost, (3) lower latency.
47 | 
48 | Integration:
49 | - Use inline within neuron/agent prompts after `<context_candidates>`.
50 | - For heavier evaluation (e.g., run tests), spawn subtasks per candidate and summarize back.
51 | 


--------------------------------------------------------------------------------
/.env.example:
--------------------------------------------------------------------------------
 1 | # MurmurAI Configuration
 2 | # All settings have sensible defaults - this file is optional for local use
 3 | 
 4 | # ============================================================================
 5 | # SECURITY NOTE
 6 | # ============================================================================
 7 | # The default API key 'namastex888' is PUBLICLY KNOWN.
 8 | # For production or any network-exposed deployment, set a secure key:
 9 | #
10 | #   MURMURAI_API_KEY=$(openssl rand -hex 32)
11 | #
12 | # See: https://github.com/namastexlabs/murmurai#security
13 | # ============================================================================
14 | 
15 | # API Authentication (default: namastex888 - CHANGE FOR PRODUCTION!)
16 | # MURMURAI_API_KEY=your-secret-api-key
17 | 
18 | # Server (defaults: 0.0.0.0:8880)
19 | # MURMURAI_HOST=0.0.0.0
20 | # MURMURAI_PORT=8880
21 | 
22 | # Data storage (default: ./data)
23 | # MURMURAI_DATA_DIR=./data
24 | 
25 | # Model settings
26 | # MURMURAI_MODEL=large-v3-turbo
27 | # MURMURAI_COMPUTE_TYPE=float16
28 | # MURMURAI_BATCH_SIZE=16
29 | 
30 | # GPU device index for multi-GPU systems (default: 0)
31 | # MURMURAI_DEVICE=0
32 | 
33 | # Default language - leave unset for auto-detect
34 | # Examples: en, pt, es, fr, de, ja, zh
35 | # MURMURAI_LANGUAGE=en
36 | 
37 | # Preload alignment models at startup (comma-separated)
38 | # MURMURAI_PRELOAD_LANGUAGES=en,es,pt
39 | 
40 | # HuggingFace token for speaker diarization (speaker_labels=true)
41 | # 1. Accept license at https://hf.co/pyannote/speaker-diarization-3.1
42 | # 2. Get token at https://hf.co/settings/tokens
43 | # MURMURAI_HF_TOKEN=hf_xxx
44 | 
45 | # Upload limits (default: 2048 MB = 2GB)
46 | # MURMURAI_MAX_UPLOAD_SIZE_MB=2048
47 | 
48 | # Logging configuration
49 | # MURMURAI_LOG_FORMAT=text    # "text" (human-readable) or "json" (structured)
50 | # MURMURAI_LOG_LEVEL=INFO     # DEBUG, INFO, WARNING, ERROR
51 | 


--------------------------------------------------------------------------------
/.github/workflows/ci.yml:
--------------------------------------------------------------------------------
 1 | name: CI
 2 | 
 3 | on:
 4 |   push:
 5 |     branches: ["*"]
 6 |   pull_request:
 7 |     branches: [main, dev]
 8 | 
 9 | jobs:
10 |   lint:
11 |     name: Lint
12 |     runs-on: ubuntu-latest
13 |     steps:
14 |       - uses: actions/checkout@v4
15 | 
16 |       - name: Install uv
17 |         uses: astral-sh/setup-uv@v4
18 |         with:
19 |           version: "latest"
20 | 
21 |       - name: Set up Python
22 |         run: uv python install 3.12
23 | 
24 |       - name: Install dependencies
25 |         run: uv sync --dev
26 | 
27 |       - name: Run ruff check
28 |         run: uv run ruff check .
29 | 
30 |       - name: Run ruff format check
31 |         run: uv run ruff format --check .
32 | 
33 |   typecheck:
34 |     name: Type Check
35 |     runs-on: ubuntu-latest
36 |     steps:
37 |       - uses: actions/checkout@v4
38 | 
39 |       - name: Install uv
40 |         uses: astral-sh/setup-uv@v4
41 |         with:
42 |           version: "latest"
43 | 
44 |       - name: Set up Python
45 |         run: uv python install 3.12
46 | 
47 |       - name: Install dependencies
48 |         run: uv sync --dev
49 | 
50 |       - name: Run mypy
51 |         run: uv run mypy src/
52 | 
53 |   test:
54 |     name: Test
55 |     runs-on: ubuntu-latest
56 |     steps:
57 |       - uses: actions/checkout@v4
58 | 
59 |       - name: Install uv
60 |         uses: astral-sh/setup-uv@v4
61 |         with:
62 |           version: "latest"
63 | 
64 |       - name: Set up Python
65 |         run: uv python install 3.12
66 | 
67 |       - name: Install dependencies
68 |         run: uv sync --dev
69 | 
70 |       - name: Run tests with coverage
71 |         run: uv run pytest tests/ -v --cov=src/murmurai --cov-report=xml --cov-report=term
72 | 
73 |       - name: Upload coverage to Codecov
74 |         uses: codecov/codecov-action@v4
75 |         with:
76 |           files: ./coverage.xml
77 |           fail_ci_if_error: false
78 |         continue-on-error: true
79 | 


--------------------------------------------------------------------------------
/.genie/product/templates/qa-done-report-template.md:
--------------------------------------------------------------------------------
 1 | # Done Report: qa-<slug>-<YYYYMMDDHHmm>
 2 | ## Executive Summary
 3 | - **Checklist items tested:** X/Y
 4 | - **New scenarios discovered:** A
 5 | - **Bugs found:** B (C critical, D high, E medium)
 6 | - **Checklist items added:** F
 7 | 
 8 | ## Test Matrix
 9 | 
10 | ### Checklist Items (from @.genie/qa/checklist.md)
11 | | Item | Category | Status | Evidence |
12 | |------|----------|--------|----------|
13 | | <name> | <cat> | ✅ Pass | cmd-<name>-<ts>.txt |
14 | | <name> | <cat> | ❌ Fail | error-<name>-<ts>.txt |
15 | 
16 | ### New Scenarios (discovered during this run)
17 | | Scenario | Category | Status | Added to Checklist |
18 | |----------|----------|--------|-------------------|
19 | | <name> | <cat> | ✅ Pass | ✅ Yes (via learn) |
20 | 
21 | ## Bugs Found
22 | 
23 | ### 🔴 CRITICAL (X)
24 | **[BUG] <Description>**
25 | - **Reproduction:** <steps>
26 | - **Expected:** <behavior>
27 | - **Actual:** <behavior>
28 | - **Evidence:** .genie/qa/evidence/ (created during test execution)<file>
29 | - **Filed:** Issue #XX
30 | - **Owner:** <agent/person>
31 | 
32 | ### 🟠 HIGH (X)
33 | (same format)
34 | 
35 | ### 🟡 MEDIUM (X)
36 | (same format)
37 | 
38 | ## Learning Summary
39 | 
40 | **Items added to checklist:**
41 | 1. <Item name> (<category>)
42 | 2. <Item name> (<category>)
43 | 
44 | **Learn agent sessions:**
45 | - Session <id>: Added <item>
46 | - Session <id>: Added <item>
47 | 
48 | ## Evidence Archive
49 | Location: .genie/qa/evidence/ (created during test execution)
50 | 
51 | **Terminal outputs:** X files
52 | **Screenshots:** Y files
53 | **Logs:** Z files
54 | 
55 | ## Coverage Analysis
56 | - **<Category 1>:** X/Y tested (Z%)
57 | - **<Category 2>:** X/Y tested (Z%)
58 | - **Overall:** X/Y scenarios validated (Z%)
59 | 
60 | ## Follow-Ups
61 | 1. <Action> - <Priority>
62 | 2. <Action> - <Priority>
63 | 
64 | ## Verdict
65 | **Status:** <APPROVED | BLOCKED>
66 | **Confidence:** <LOW | MEDIUM | HIGH>
67 | **Recommendation:** <action items>
68 | 


--------------------------------------------------------------------------------
/tests/test_auth.py:
--------------------------------------------------------------------------------
 1 | """Tests for API authentication."""
 2 | 
 3 | import pytest
 4 | from fastapi import HTTPException
 5 | 
 6 | from murmurai_server.auth import verify_api_key
 7 | 
 8 | 
 9 | @pytest.mark.asyncio
10 | async def test_valid_api_key(test_settings, test_api_key):
11 |     """Test that valid API key passes verification."""
12 |     result = await verify_api_key(api_key=test_api_key)
13 |     assert result == test_api_key
14 | 
15 | 
16 | @pytest.mark.asyncio
17 | async def test_invalid_api_key(test_settings):
18 |     """Test that invalid API key raises 401."""
19 |     with pytest.raises(HTTPException) as exc_info:
20 |         await verify_api_key(api_key="wrong-api-key")
21 | 
22 |     assert exc_info.value.status_code == 401
23 |     assert "Invalid API key" in exc_info.value.detail
24 | 
25 | 
26 | @pytest.mark.asyncio
27 | async def test_empty_api_key(test_settings):
28 |     """Test that empty API key raises 401."""
29 |     with pytest.raises(HTTPException) as exc_info:
30 |         await verify_api_key(api_key="")
31 | 
32 |     assert exc_info.value.status_code == 401
33 | 
34 | 
35 | @pytest.mark.asyncio
36 | async def test_api_key_case_sensitive(test_settings, test_api_key):
37 |     """Test that API key comparison is case-sensitive."""
38 |     with pytest.raises(HTTPException) as exc_info:
39 |         await verify_api_key(api_key=test_api_key.upper())
40 | 
41 |     assert exc_info.value.status_code == 401
42 | 
43 | 
44 | @pytest.mark.asyncio
45 | async def test_bearer_prefix_stripped(test_settings, test_api_key):
46 |     """Test that Bearer prefix is properly stripped."""
47 |     result = await verify_api_key(api_key=f"Bearer {test_api_key}")
48 |     assert result == test_api_key
49 | 
50 | 
51 | @pytest.mark.asyncio
52 | async def test_bearer_prefix_wrong_key(test_settings):
53 |     """Test that Bearer prefix with wrong key still fails."""
54 |     with pytest.raises(HTTPException) as exc_info:
55 |         await verify_api_key(api_key="Bearer wrong-key")
56 | 
57 |     assert exc_info.value.status_code == 401
58 | 


--------------------------------------------------------------------------------
/tests/test_config.py:
--------------------------------------------------------------------------------
 1 | """Tests for configuration management."""
 2 | 
 3 | from pathlib import Path
 4 | 
 5 | 
 6 | def test_settings_loads_with_env_vars(test_settings):
 7 |     """Test that settings load correctly from environment."""
 8 |     assert test_settings.api_key == "test-api-key-12345"
 9 |     assert test_settings.host == "127.0.0.1"
10 |     assert test_settings.port == 8880
11 | 
12 | 
13 | def test_settings_default_values(test_settings):
14 |     """Test that default values are applied correctly."""
15 |     assert test_settings.model == "large-v3-turbo"
16 |     assert test_settings.compute_type == "float16"
17 |     assert test_settings.batch_size == 16
18 |     assert test_settings.hf_token is None
19 | 
20 | 
21 | def test_db_path_property(test_settings):
22 |     """Test that db_path property returns correct path."""
23 |     expected = test_settings.data_dir / "transcripts.db"
24 |     assert test_settings.db_path == expected
25 | 
26 | 
27 | def test_max_upload_bytes_property(test_settings):
28 |     """Test that max_upload_bytes property returns correct value."""
29 |     expected = test_settings.max_upload_size_mb * 1024 * 1024
30 |     assert test_settings.max_upload_bytes == expected
31 | 
32 | 
33 | def test_default_api_key_works(monkeypatch, tmp_path):
34 |     """Test that default API key allows startup without .env."""
35 |     from murmurai_server.config import get_settings
36 | 
37 |     # Clear cache
38 |     get_settings.cache_clear()
39 | 
40 |     # Remove API key from environment
41 |     monkeypatch.delenv("MURMURAI_API_KEY", raising=False)
42 | 
43 |     # Create empty .env to prevent loading from project .env
44 |     empty_env = tmp_path / ".env"
45 |     empty_env.touch()
46 |     monkeypatch.chdir(tmp_path)
47 | 
48 |     # Should work with default api_key
49 |     settings = get_settings()
50 |     assert settings.api_key == "namastex888"
51 | 
52 | 
53 | def test_data_dir_is_path(test_settings):
54 |     """Test that data_dir is a Path object."""
55 |     assert isinstance(test_settings.data_dir, Path)
56 | 


--------------------------------------------------------------------------------
/.genie/neurons/genie.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: GENIE
 3 | description: Persistent genie orchestrator (neuron)
 4 | genie:
 5 |   executor:
 6 |     - CLAUDE_CODE
 7 |     - CODEX
 8 |     - OPENCODE
 9 |   background: true
10 | forge:
11 |   CLAUDE_CODE:
12 |     model: sonnet
13 |     dangerously_skip_permissions: true
14 |   CODEX:
15 |     model: gpt-5-codex
16 |     sandbox: danger-full-access
17 |   OPENCODE:
18 |     model: opencode/glm-4.6
19 | ---
20 | 
21 | # Genie
22 | 
23 | You are Genie, the top-level orchestrator for complex multi-step workflows and installations.
24 | 
25 | ## Your Role
26 | 
27 | - Coordinate installation flows (`genie init`)
28 | - Orchestrate multi-agent workflows across collectives
29 | - Handle high-level decision making and routing
30 | - Delegate to specialized orchestrators (Wish, Forge, Review)
31 | - Maintain workspace coherence and state
32 | 
33 | ## Installation Flow
34 | 
35 | 1. **Context Acquisition**: Run explorer to understand workspace structure and requirements
36 | 2. **User Interview**: Gather preferences, requirements, and constraints
37 | 3. **Template Selection**: Choose appropriate collectives and agents to install
38 | 4. **Installation Delegation**: Spawn installer agents for each component
39 | 5. **Validation**: Verify successful setup and configuration
40 | 6. **Handoff**: Guide user to next steps and available commands
41 | 
42 | ## Orchestration Principles
43 | 
44 | - Delegate to specialists (never implement yourself - Amendment #4)
45 | - Coordinate parallel work streams when appropriate
46 | - Track progress across multiple agents and tasks
47 | - Escalate blockers to user when needed
48 | - Maintain big-picture view and context
49 | 
50 | ## Integration Points
51 | 
52 | - **Explorer**: Workspace discovery and context gathering
53 | - **Wish**: Feature planning and specification
54 | - **Forge**: Task execution and implementation
55 | - **Review**: Quality gates and validation
56 | - **Installers**: Template deployment and configuration
57 | 
58 | ## Never Do
59 | 
60 | - ❌ Implement code yourself (delegate to specialists)
61 | - ❌ Skip context gathering phase
62 | - ❌ Make decisions without user input on preferences
63 | - ❌ Proceed when blocked (escalate to user)
64 | 


--------------------------------------------------------------------------------
/pyproject.toml:
--------------------------------------------------------------------------------
 1 | [build-system]
 2 | requires = ["hatchling"]
 3 | build-backend = "hatchling.build"
 4 | 
 5 | [project]
 6 | name = "murmurai"
 7 | version = "1.0.4"
 8 | description = "GPU-powered transcription API with speaker diarization"
 9 | readme = "README.md"
10 | requires-python = "==3.12.*"
11 | license = {text = "MIT"}
12 | keywords = ["murmurai", "transcription", "speech-to-text", "api", "whisper", "diarization"]
13 | authors = [
14 |     {name = "Felipe Rosa"},
15 |     {name = "Namastex Labs"}
16 | ]
17 | classifiers = [
18 |     "Development Status :: 4 - Beta",
19 |     "Environment :: GPU :: NVIDIA CUDA",
20 |     "Framework :: FastAPI",
21 |     "Programming Language :: Python :: 3.12",
22 |     "License :: OSI Approved :: MIT License",
23 |     "Operating System :: OS Independent",
24 |     "Topic :: Multimedia :: Sound/Audio :: Speech",
25 | ]
26 | 
27 | dependencies = [
28 |     "murmurai-core>=1.0.5",
29 |     "fastapi>=0.110",
30 |     "uvicorn>=0.25",
31 |     "pydantic>=2.5",
32 |     "pydantic-settings>=2.3",
33 |     "python-multipart>=0.0.7",
34 |     "aiosqlite>=0.20",
35 |     "httpx>=0.27",
36 |     "python-dotenv>=1.0",
37 | ]
38 | 
39 | [project.scripts]
40 | murmurai = "murmurai_server.main:run"
41 | 
42 | [project.urls]
43 | Homepage = "https://github.com/namastexlabs/murmurai"
44 | Repository = "https://github.com/namastexlabs/murmurai.git"
45 | Issues = "https://github.com/namastexlabs/murmurai/issues"
46 | 
47 | [tool.hatch.build.targets.wheel]
48 | packages = ["src/murmurai_server"]
49 | 
50 | [tool.hatch.build.targets.wheel.sources]
51 | "src" = ""
52 | 
53 | [tool.uv]
54 | managed = true
55 | 
56 | [tool.ruff]
57 | target-version = "py312"
58 | line-length = 100
59 | 
60 | [tool.ruff.lint]
61 | select = ["E", "F", "I", "UP"]
62 | ignore = ["E501", "E402"]
63 | 
64 | [tool.mypy]
65 | python_version = "3.12"
66 | strict = false
67 | warn_unused_ignores = false
68 | ignore_missing_imports = true
69 | disable_error_code = ["import-untyped", "no-untyped-def", "attr-defined"]
70 | 
71 | [tool.pytest.ini_options]
72 | asyncio_mode = "auto"
73 | testpaths = ["tests"]
74 | 
75 | [dependency-groups]
76 | dev = [
77 |     "httpx>=0.28.1",
78 |     "mypy>=1.0",
79 |     "pre-commit>=4.5.0",
80 |     "pytest>=9.0.2",
81 |     "pytest-asyncio>=1.3.0",
82 |     "pytest-cov>=7.0.0",
83 |     "ruff>=0.8",
84 | ]
85 | 


--------------------------------------------------------------------------------
/.genie/product/tech-stack.md:
--------------------------------------------------------------------------------
 1 | # Genie Dev Technical Stack
 2 | Genie Dev extends the core Genie template with diagnostics and automation focused on self-evolution. The stack stays lightweight so downstream repos can still install it cleanly.
 3 | 
 4 | ## Core CLI
 5 | - **Runtime:** Node.js 20.x managed with `pnpm`
 6 | - **Language:** TypeScript 5.9 (compiled via `src/cli/tsconfig.json`)
 7 | - **UI:** `ink` + `react` for interactive CLI flows
 8 | - **Formatting & Parsing:** `yaml` for agent metadata, native fs/stream tooling for logs
 9 | 
10 | ## Agent Assets
11 | - **Prompts:** Markdown agents under `.genie/agents/` with shared personas in `.genie/agents/core/`
12 | - **Project Overrides:** Add a short "Project Notes" section inside relevant agent or spell docs (no separate `custom/` directory)
13 | - **State:** Session and ledger files stored in `.genie/state/` (never edit manually; inspect via MCP genie tools: `mcp__genie__list_sessions`, `mcp__genie__view`)
14 | 
15 | ## Testing & Validation
16 | - **Smoke Suite:** `tests/genie-cli.test.js` exercises CLI commands and prompt loading
17 | - **Identity Check:** `tests/identity-smoke.sh` ensures guardrails match expectations
18 | - **Recommended Checks:** `pnpm run build:genie` followed by `pnpm run test:genie` before publishing upgrades
19 | 
20 | ## Meta-Agent Instrumentation
21 | - **Done Reports:** `.genie/wishes/<slug>/reports/` captures experiment evidence and upgrade readiness
22 | - **Learning Ledger:** `.genie/instructions/*` houses behavioural overrides promoted from experiments
23 | - **Genie Orchestrator:** `.genie/agents/orchestrator.md` powers second-opinion audits before adopting risky changes
24 | 
25 | ## Toolchain Integrations
26 | - **Version Control:** Git-driven; branch `genie-dev` serves as the experimental lane
27 | - **CI Hooks (planned):** GitHub Actions pipeline to run build + smoke tests and publish artefacts for review
28 | - **Optional Runtimes:** Node/TS remains primary; Rust components can be referenced via `vendors/` for cross-language experiments
29 | 
30 | ## Observability
31 | - **Logs:** CLI captures command transcripts under `.genie/state/logs/`
32 | - **Metrics (manual):** Encourage recording latency/quality metrics inside wish evidence tables until automated collectors land
33 | 
34 | This stack keeps Genie fast to iterate while providing the hooks required for self-auditing and safe downstream adoption.
35 | 


--------------------------------------------------------------------------------
/.genie/code/agents/update/upstream-update.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: upstream-update
 3 | description: Automate upstream dependency updates with comprehensive validation
 4 | genie:
 5 |   executor:
 6 |     - CLAUDE_CODE
 7 |     - CODEX
 8 |     - OPENCODE
 9 |   background: false
10 | forge:
11 |   CLAUDE_CODE:
12 |     model: sonnet
13 |     dangerously_skip_permissions: true
14 |   CODEX:
15 |     model: gpt-5-codex
16 |     sandbox: danger-full-access
17 |   OPENCODE:
18 |     model: opencode/glm-4.6
19 | ---
20 | 
21 | # Upstream Update Agent
22 | 
23 | **Role:** Automate upstream dependency updates with comprehensive validation
24 | 
25 | ## Core Responsibility
26 | 
27 | Execute complete upstream update workflows, including:
28 | - Fork synchronization
29 | - Mechanical rebranding
30 | - Release creation
31 | - Gitmodule updates
32 | - Type regeneration
33 | - Build verification
34 | - Automated fix generation
35 | 
36 | ## Execution Pattern
37 | 
38 | When given an upstream update task:
39 | 
40 | 1. **Parse Context:**
41 |    - Current version
42 |    - Target version
43 |    - Repository information
44 |    - Patches to re-apply
45 | 
46 | 2. **Execute Phases Sequentially:**
47 |    - Pre-Sync Audit (gap detection)
48 |    - Fork Sync (mirror upstream)
49 |    - Mechanical Rebrand (remove vendor references)
50 |    - Release Creation (tag + GitHub release)
51 |    - Gitmodule Update (point to new tag)
52 |    - Type Regeneration & Build
53 |    - Post-Sync Validation
54 |    - Automated Fix Generation
55 |    - Commit & Push
56 | 
57 | 3. **Success Criteria Validation:**
58 |    - Fork mirrors upstream exactly
59 |    - Rebrand applied (0 vendor references except packages)
60 |    - Tag created with correct naming
61 |    - GitHub release published
62 |    - Build passes
63 |    - All gaps documented with fix scripts
64 | 
65 | ## Tools & Automation
66 | 
67 | - Use Git agent for repository operations
68 | - Execute build commands directly
69 | - Generate fix scripts for detected gaps
70 | - Document all changes comprehensively
71 | 
72 | ## Output Format
73 | 
74 | Provide detailed phase-by-phase execution log with:
75 | - ✅ Success markers
76 | - ❌ Failure markers
77 | - 📋 Gap documentation
78 | - 🔧 Fix scripts generated
79 | 
80 | ## Error Handling
81 | 
82 | - Halt on critical failures
83 | - Document all gaps found
84 | - Generate automated fixes where possible
85 | - Provide manual intervention steps when needed
86 | 


--------------------------------------------------------------------------------
/.genie/spells/break-things-move-fast.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: No Backwards Compatibility
 3 | description: Replace old behavior entirely, never preserve legacy features
 4 | ---
 5 | 
 6 | # No Backwards Compatibility
 7 | 
 8 | **Pattern:** This project does NOT support backwards compatibility or legacy features.
 9 | 
10 | **When planning fixes or enhancements:**
11 | - ❌ NEVER suggest `--metrics`, `--legacy`, `--compat` flags or similar
12 | - ❌ NEVER propose preserving old behavior alongside new behavior
13 | - ❌ NEVER say "we could add X flag for backwards compatibility"
14 | - ✅ ALWAYS replace old behavior entirely with new behavior
15 | - ✅ ALWAYS verify if suggested flags actually exist (search codebase first)
16 | - ✅ ALWAYS simplify by removing obsolete code completely
17 | 
18 | **Example (WRONG):**
19 | > "We could add a `--metrics` flag to preserve the old system metrics view for users who need it."
20 | 
21 | **Example (CORRECT):**
22 | > "Replace the metrics view entirely with the conversation view. Remove all metrics-related code."
23 | 
24 | **Why:**
25 | - This is a research preview / alpha project
26 | - Breaking changes are acceptable and expected
27 | - Cleaner codebase without legacy cruft
28 | - Faster iteration without compatibility constraints
29 | - **GENIE ONLY SELF-EVOLVES** - No dead code, no legacy sections, no "preserved for reference"
30 | 
31 | **Validation:**
32 | - Before suggesting new flags, run: `grep -r "flag_name" .`
33 | - If flag doesn't exist and solves backwards compat → it's hallucinated, remove it
34 | 
35 | ## Critical Violation Pattern
36 | 
37 | **NEVER write "Legacy Content" or "Preserved for Reference" sections.**
38 | 
39 | **Anti-Pattern (WRONG):**
40 | ```markdown
41 | ## Migration Notice
42 | This agent now delegates to spell...
43 | 
44 | ## Legacy Content (Pre-Migration)
45 | The content below is preserved for reference...
46 | ```
47 | 
48 | **Correct Pattern:**
49 | ```markdown
50 | # Agent Name
51 | [New behavior only, delete old content entirely]
52 | ```
53 | 
54 | **Why:** Genie self-evolves. When knowledge moves from agent → spell, DELETE the agent or REPLACE it entirely with new purpose. Never keep "legacy sections" or "backward compatibility" blocks.
55 | 
56 | **Evidence:** Learning session 2025-10-23 - Attempted to preserve debug agent content with "Legacy Content (Pre-Migration)" section. Violation. Correct approach: DELETE debug agent entirely, CREATE fix agent with new purpose.
57 | 


--------------------------------------------------------------------------------
/.genie/code/spells/agent-configuration.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Agent Configuration Standards
 3 | description: Declare permissionMode: default for agents that write files
 4 | genie:
 5 |   executor: [CLAUDE_CODE, CODEX, OPENCODE]
 6 | forge:
 7 |   CLAUDE_CODE:
 8 |     model: sonnet
 9 |   CODEX: {}
10 |   OPENCODE: {}
11 | ---
12 | 
13 | # Agent Configuration Standards
14 | 
15 | ## File Write Permissions
16 | 
17 | **Rule:** All agents requiring file write access MUST explicitly declare `permissionMode: default` in their frontmatter.
18 | 
19 | **Context:** Discovered 2025-10-13 when Claude agents with `executor: claude` were unable to write files. Permission prompts auto-skipped because stdin was hardcoded to `'ignore'` during process spawn, making `permissionMode: acceptEdits` completely non-functional.
20 | 
21 | **Why this matters:**
22 | - Default executor config doesn't grant write access
23 | - Without explicit `permissionMode: default`, agents silently fail on file operations
24 | - Background spell (`background: true`) requires the same permission declaration
25 | 
26 | **Agent categories:**
27 | 
28 | **Implementation agents** (REQUIRE `permissionMode: default`):
29 | - Core delivery: `implementor`, `tests`, `polish`, `refactor`, `git`
30 | - Infrastructure: `install`, `learn`, `commit`, `review`
31 | - Workflow orchestrators: `wish`, `plan`, `forge`, `vibe`, `qa`
32 | 
33 | **Analysis agents** (READ-ONLY, no permissionMode needed):
34 | - `analyze`, `audit`, `debug`, `genie`, `prompt`
35 | 
36 | **Configuration hierarchy:**
37 | 1. **Agent frontmatter** (highest priority) ← Use this level
38 | 2. Config override (`.genie/cli/config.yaml:48`)
39 | 3. Executor default (`claude.ts:13`)
40 | 
41 | **Implementation example:**
42 | ```yaml
43 | ```
44 | 
45 | **Validation:**
46 | ```bash
47 | # Check all implementation agents have permissionMode
48 | grep -L "permissionMode:" .genie/agents/{implementor,tests,polish,refactor,git,install,learn,commit}.md
49 | # Should return empty (all agents have the setting)
50 | 
51 | # Test file write capability (via MCP, not CLI)
52 | # Use mcp__genie__run with agent="implementor" and prompt="Create test file at /tmp/test.txt"
53 | # Should create file without permission prompts
54 | ```
55 | 
56 | **Future work:** Issue #35 tracks interactive permission system for foreground/background pause-and-resume approval workflow.
57 | 
58 | **Root cause reference:** Debug session `292942e0-07d1-4448-8d5e-74db8acc8c5b` identified stdin configuration at `src/cli/cli-core/handlers/shared.ts:391` (historical reference).
59 | 


--------------------------------------------------------------------------------
/tests/conftest.py:
--------------------------------------------------------------------------------
 1 | """Shared test fixtures for murmurai."""
 2 | 
 3 | from collections.abc import AsyncGenerator
 4 | from pathlib import Path
 5 | from unittest.mock import patch
 6 | 
 7 | import pytest
 8 | import pytest_asyncio
 9 | from httpx import ASGITransport, AsyncClient
10 | 
11 | 
12 | @pytest.fixture(autouse=True)
13 | def reset_settings_cache():
14 |     """Reset settings cache between tests."""
15 |     from murmurai_server.config import get_settings
16 | 
17 |     get_settings.cache_clear()
18 |     yield
19 |     get_settings.cache_clear()
20 | 
21 | 
22 | @pytest.fixture
23 | def test_api_key() -> str:
24 |     """Return test API key."""
25 |     return "test-api-key-12345"
26 | 
27 | 
28 | @pytest.fixture
29 | def test_env(test_api_key: str, tmp_path: Path, monkeypatch: pytest.MonkeyPatch):
30 |     """Set up test environment variables."""
31 |     # Change to tmp_path to avoid loading project .env file
32 |     monkeypatch.chdir(tmp_path)
33 |     monkeypatch.setenv("MURMURAI_API_KEY", test_api_key)
34 |     monkeypatch.setenv("MURMURAI_DATA_DIR", str(tmp_path))
35 |     monkeypatch.setenv("MURMURAI_HOST", "127.0.0.1")
36 |     monkeypatch.setenv("MURMURAI_PORT", "8880")
37 |     # Ensure HF token is not inherited from local .env
38 |     monkeypatch.delenv("MURMURAI_HF_TOKEN", raising=False)
39 | 
40 | 
41 | @pytest.fixture
42 | def test_settings(test_env):
43 |     """Get settings configured for testing."""
44 |     from murmurai_server.config import get_settings
45 | 
46 |     return get_settings()
47 | 
48 | 
49 | @pytest_asyncio.fixture
50 | async def initialized_db(test_settings):
51 |     """Initialize database for testing."""
52 |     from murmurai_server.database import init_db
53 | 
54 |     await init_db()
55 | 
56 | 
57 | @pytest_asyncio.fixture
58 | async def async_client(test_env, initialized_db) -> AsyncGenerator[AsyncClient, None]:
59 |     """Create async HTTP client for testing API endpoints."""
60 |     from murmurai_server.server import app
61 | 
62 |     async with AsyncClient(
63 |         transport=ASGITransport(app=app),
64 |         base_url="http://test",
65 |     ) as client:
66 |         yield client
67 | 
68 | 
69 | @pytest.fixture
70 | def auth_headers(test_api_key: str) -> dict[str, str]:
71 |     """Return headers with valid API key."""
72 |     return {"Authorization": test_api_key}
73 | 
74 | 
75 | @pytest.fixture
76 | def mock_gpu_available():
77 |     """Mock torch.cuda.is_available to return True."""
78 |     with patch("torch.cuda.is_available", return_value=True):
79 |         with patch("torch.cuda.get_device_name", return_value="Mock GPU"):
80 |             yield
81 | 


--------------------------------------------------------------------------------
/.genie/spells/context-candidates.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Context Candidates (ACE‑style)
 3 | description: Generate 2–3 task‑conditioned context variants, evaluate, and select under budget
 4 | ---
 5 | 
 6 | # Context Candidates – Agentic Context Engineering Pattern
 7 | 
 8 | Goal: Before committing to a single context pack, propose 2–3 viable variants, evaluate quickly, and select the best tradeoff of quality, tokens, and latency.
 9 | 
10 | When to use:
11 | - New wish creation or major context refresh
12 | - Uncertain retrieval scope or compression level
13 | - Performance or token constraints are tight
14 | 
15 | Protocol:
16 | 1) Propose Candidates
17 | - Build 2–3 variants with different knobs:
18 |   - Retrieval scope: narrow vs broad
19 |   - Compression: extractive vs abstractive
20 |   - Structure: order, grouping, summaries first vs full refs
21 |   - Cost target: low/med/high token budgets
22 | - Output structure:
23 | ```
24 | <context_candidates>
25 | - id: C1
26 |   budget: low|med|high
27 |   ingredients: [@file, @doc, session, summary]
28 |   assembly: steps (filter/merge/summarize/reorder)
29 |   rationale: one line
30 | - id: C2
31 |   ...
32 | - id: C3
33 |   ...
34 | </context_candidates>
35 | ```
36 | 
37 | 2) Evaluate Quickly
38 | - Use cheap, task‑appropriate checks (pick 1–2):
39 |   - Answerability probe (can we answer the core question?)
40 |   - Coverage checklist (all required sections present?)
41 |   - Sanity metrics (duplication, staleness, token size)
42 | - Score each as 0–1 on dimensions:
43 | ```
44 | <context_scores>
45 | - id: C1
46 |   quality: 0.0–1.0
47 |   cost: tokens or rough band (low/med/high)
48 |   latency: seconds (if known) or band
49 |   notes: brief observation
50 | - id: C2 ...
51 | </context_scores>
52 | ```
53 | 
54 | 3) Select and Commit
55 | - Pick winner by quality first, then cost/latency
56 | - Record selection + reason and proceed with the winner only
57 | ```
58 | <selection>
59 |   winner: C2
60 |   reason: brief tradeoff statement
61 | </selection>
62 | ```
63 | 
64 | 4) Record in Wish Markdown
65 | - In the wish file's "Context Variants Considered" section, list candidates (C1/C2/C3), brief scores, and the selected winner with a one‑line reason.
66 | 
67 | Promotion (Durable Learning):
68 | - If a recipe repeatedly wins for a task archetype, synthesize a tiny, reusable spell capturing the recipe (ingredients + assembly) and commit to `.genie/spells/`.
69 | 
70 | Notes:
71 | - Keep candidate generation within a single neuron/agent attempt when possible.
72 | - For heavier checks, create subtasks per candidate via `mcp__genie__create_subtask` and aggregate scores back.
73 | 


--------------------------------------------------------------------------------
/.genie/spells/experiment.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Experimentation Protocol
 3 | description: Always experiment with clear hypotheses during learning
 4 | ---
 5 | 
 6 | # Experimentation Protocol
 7 | 
 8 | **Core philosophy:** Learning = Experimentation
 9 | 
10 | **Rule:** ALWAYS EXPERIMENT during learning. Experimentation is not optional—it's how we discover better patterns.
11 | 
12 | ## Experimentation Framework
13 | 
14 | **Protocol:**
15 | 1. **Hypothesis**: State what you're testing explicitly
16 | 2. **Experiment**: Try it (with appropriate safety checks)
17 | 3. **Observe**: Capture results and unexpected behaviors
18 | 4. **Learn**: Document finding as new knowledge
19 | 5. **Apply**: Use learning in future tasks
20 | 
21 | **Example experiments:**
22 | - "Let me try natural routing instead of direct MCP for this workflow and observe the difference..."
23 | - "Testing if git can handle bulk label updates..."
24 | - "Experimenting with combining genie + implementor agents for this task..."
25 | 
26 | ## Safe Experimentation Guidelines
27 | 
28 | **Always safe:**
29 | - Read-only operations (list, view, analyze)
30 | - Tool combination experiments
31 | - Workflow pattern exploration
32 | - Query optimization tests
33 | 
34 | **Requires explanation first:**
35 | - Write operations (explain intent, get approval if destructive)
36 | - Configuration changes
37 | - External API calls
38 | - Git operations (especially push, force, rebase)
39 | 
40 | **Documentation pattern:**
41 | After experiment, capture in done reports or learning entries:
42 | ```
43 | **Experiment**: Tried X approach for Y task
44 | **Hypothesis**: Expected Z outcome
45 | **Result**: Actually observed A, discovered B
46 | **Learning**: Will use A pattern going forward because B
47 | ```
48 | 
49 | ## Meta-Principle
50 | 
51 | **Felipe guides alongside the learning process.** Treat each session as an opportunity to discover better patterns through active experimentation. Don't wait for permission to try—experiment safely, document findings, and iterate.
52 | 
53 | **Validation:**
54 | ```bash
55 | # Check learning entries show experimentation
56 | grep -i "experiment\|try\|test\|discover" AGENTS.md | wc -l
57 | # Should show multiple references
58 | 
59 | # Observe agent behavior:
60 | # - Does agent suggest experiments proactively?
61 | # - Does agent try new approaches?
62 | # - Does agent document learnings from experiments?
63 | ```
64 | 
65 | **Context:** Discovered 2025-10-13 that learning process was overly cautious, waiting for explicit instructions rather than experimenting with available tools and patterns. Shifted to experimentation-first approach.
66 | 


--------------------------------------------------------------------------------
/src/murmurai_server/main.py:
--------------------------------------------------------------------------------
 1 | """Main entry point for MurmurAI."""
 2 | 
 3 | import argparse
 4 | import sys
 5 | 
 6 | import uvicorn
 7 | 
 8 | from murmurai_server.config import get_settings
 9 | from murmurai_server.deps import startup_check
10 | 
11 | 
12 | def run() -> None:
13 |     """Main entry point - starts API server."""
14 |     parser = argparse.ArgumentParser(
15 |         description="MurmurAI - GPU-powered transcription service",
16 |         formatter_class=argparse.RawDescriptionHelpFormatter,
17 |         epilog="""\
18 | Examples:
19 |   murmurai                        Start server with default settings
20 |   murmurai --force                Start even if dependencies are missing
21 |   murmurai --skip-check           Skip dependency check entirely
22 | 
23 | Environment variables:
24 |   MURMURAI_API_KEY               API authentication key (required)
25 |   MURMURAI_HOST                  Server bind address (default: 0.0.0.0)
26 |   MURMURAI_PORT                  Server port (default: 8880)
27 |   MURMURAI_MODEL                 Model name (default: large-v3-turbo)
28 |   MURMURAI_HF_TOKEN              HuggingFace token for diarization
29 | 
30 | Full docs: https://github.com/namastexlabs/murmurai
31 | """,
32 |     )
33 |     parser.add_argument(
34 |         "--force",
35 |         action="store_true",
36 |         help="Start server even if dependencies are missing",
37 |     )
38 |     parser.add_argument(
39 |         "--skip-check",
40 |         action="store_true",
41 |         help="Skip dependency check entirely",
42 |     )
43 |     parser.add_argument(
44 |         "--version",
45 |         action="store_true",
46 |         help="Show version and exit",
47 |     )
48 | 
49 |     args = parser.parse_args()
50 | 
51 |     if args.version:
52 |         from murmurai_server import __version__
53 | 
54 |         print(f"murmurai {__version__}")
55 |         sys.exit(0)
56 | 
57 |     # Run dependency check unless skipped
58 |     if not args.skip_check:
59 |         startup_check(force=args.force)
60 | 
61 |     settings = get_settings()
62 | 
63 |     # Ensure data directory exists
64 |     settings.data_dir.mkdir(parents=True, exist_ok=True)
65 | 
66 |     print(f"MurmurAI starting on http://{settings.host}:{settings.port}")
67 |     print(f"Model: {settings.model}")
68 |     print(f"Data directory: {settings.data_dir}")
69 |     print(f"API docs: http://{settings.host}:{settings.port}/docs")
70 | 
71 |     # Start FastAPI server
72 |     uvicorn.run(
73 |         "murmurai_server.server:app",
74 |         host=settings.host,
75 |         port=settings.port,
76 |         reload=False,
77 |     )
78 | 
79 | 
80 | if __name__ == "__main__":
81 |     run()
82 | 


--------------------------------------------------------------------------------
/.genie/code/spells/publishing-protocol.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Publishing Protocol *(CRITICAL)*
 3 | description: Never publish directly; always delegate to the release agent
 4 | genie:
 5 |   executor: [CLAUDE_CODE, CODEX, OPENCODE]
 6 | forge:
 7 |   CLAUDE_CODE:
 8 |     model: sonnet
 9 |   CODEX: {}
10 |   OPENCODE: {}
11 | ---
12 | 
13 | # Publishing Protocol *(CRITICAL)*
14 | 
15 | **NEVER** execute `npm publish` or `gh release create` directly. **ALWAYS** delegate to release agent.
16 | 
17 | ## Forbidden Actions
18 | 
19 | - ❌ `npm publish` (bypasses validation, GitHub release, audit trail)
20 | - ❌ `gh release create` (direct command - let agent orchestrate)
21 | - ❌ Manual version tagging without release agent
22 | - ❌ Using `/release` slash command with arguments (incorrect invocation)
23 | 
24 | ## Required Workflow
25 | 
26 | **If you ARE the release agent:**
27 | - ✅ Execute workflow directly: run pre-flight checks, create GitHub release via `gh release create`, monitor Actions
28 | - ❌ NEVER delegate to yourself or invoke `mcp__genie__run` with agent="release"
29 | 
30 | **If you are NOT the release agent (genie/planner/main):**
31 | 1. Commit code + version bump to main
32 | 2. Delegate to release agent: `mcp__genie__run with agent="release" and prompt="Create release for vX.Y.Z"`
33 | 3. Release agent validates, creates GitHub release, monitors npm publish
34 | 4. Provide release URL to user
35 | 
36 | ## Why This Matters
37 | 
38 | - **Safety**: Pre-flight checks (clean git, tests pass, version valid)
39 | - **Consistency**: Follows project workflow (GitHub Actions)
40 | - **Audit trail**: All releases documented in GitHub
41 | - **Rollback**: Structured process easier to revert
42 | 
43 | ## Recent Violations
44 | 
45 | **2025-10-14:**
46 | - Attempted `gh release create` manually (bypassed validation)
47 | - Attempted `npm publish` directly (timed out, triggered background agent)
48 | - Attempted `/release` with arguments instead of proper MCP invocation
49 | - **Result**: Inconsistent state, manual cleanup required
50 | - **Evidence**: Commits 0c6ef02, 30dce09, GitHub Actions runs 18506885592
51 | 
52 | **2025-10-17:**
53 | - Session ~00:50Z: Recognized RC5 release work but attempted direct handling
54 | - Failed to check routing matrix before acting on release request
55 | - Acknowledged "I'm learning" but did NOT invoke learn agent for documentation
56 | - **Result**: Routing pattern not propagated to framework
57 | - **Evidence**: User teaching 2025-10-17
58 | 
59 | ## Validation
60 | 
61 | When user says "publish" or "release", immediately check routing matrix and delegate to release agent via MCP. When user identifies routing failures, invoke learn agent immediately to document correction.
62 | 


--------------------------------------------------------------------------------
/.genie/product/roadmap.md:
--------------------------------------------------------------------------------
 1 | # Genie Dev Roadmap
 2 | The genie-dev branch is the laboratory for Genie’s self-improvement program. Phases are sequenced to keep downstream adopters safe while we iterate quickly.
 3 | 
 4 | ## Phase 0 — Baseline Capture (✅ complete)
 5 | - Neutralize template placeholders and document the current mission, tech stack, and guardrails
 6 | - Inventory existing behavioural learnings and confirm they are enforced across agents
 7 | - Establish `pnpm run build:genie` + smoke tests as the minimum verification gate
 8 | 
 9 | ## Phase 1 — Instrumentation & Telemetry (in progress)
10 | - Treat the wish **Evidence Checklist** as the gating deliverable before other instrumentation tasks proceed (see ).
11 | - Add branch-specific checklists to every wish to log evidence paths and validation commands
12 | - Expand done-report coverage so each experiment stores scope, risks, and follow-ups
13 | - Wire CLI diagnostics to surface missing sessions or misconfigured presets
14 | 
15 | ## Phase 2 — Guided Self-Improvement
16 | - Author wishes that target prompt quality, guardrail clarity, and CLI usability
17 | - Pair each wish with twin audits and validation scripts before merging back to `main`
18 | - Promote validated learnings into `.genie/instructions/` and agent briefs
19 | 
20 | ## Phase 3 — Adoption Kits for Downstream Repos
21 | - Package upgrade notes, migration diffs, and rollback guidance for every major change
22 | - Publish branch-to-main release checklist (Plan → Wish → Forge coverage, tests, done report link)
23 | - Partner with pilot teams to trial upgrades and capture their feedback in structured templates
24 | 
25 | ## Phase 4 — Automation & CI Integration
26 | - Land GitHub Actions pipeline that runs build + smoke tests and attaches artefacts to PRs
27 | - Add regression checks for behavioural rules (learn, guardrail compliance)
28 | - Introduce metrics capture (latency, wish completion velocity) with reporting hooks
29 | 
30 | ## Success Metrics
31 | - 100% of genie-dev wishes include validation commands and evidence links
32 | - Smoke suite (`pnpm run test:genie`) passing before merge on every PR
33 | - Documented learnings promoted within 48 hours of validation
34 | - Downstream adopters report <5% rollback rate on genie-dev releases
35 | 
36 | ## Dependencies & Enablers
37 | - Maintainers available for twin reviews and manual approvals
38 | - Access to GPT-5 class models (configurable via `GENIE_MODEL`)
39 | - Stable sandboxed environment mirroring production guardrails
40 | 
41 | ## Risk Log (actively monitored)
42 | - **Automation drift:** self-improvement scripts may bypass approval gates → mitigate with review checklist baked into wishes
43 | - **Telemetry gaps:** missing evidence makes regression root-cause harder → mitigate by enforcing done report template updates
44 | - **Adopter fatigue:** too many upgrades without guides → mitigate by bundling changes into release kits with opt-in toggles
45 | 


--------------------------------------------------------------------------------
/.genie/product/environment.md:
--------------------------------------------------------------------------------
 1 | # Genie Dev Environment Configuration
 2 | Genie Dev relies on a small set of environment variables to steer the CLI, model selection, and self-improvement experiments. Configure these in a local `.env` and load them before running the CLI.
 3 | 
 4 | ## Conventions
 5 | - Names: UPPER_SNAKE_CASE
 6 | - Types: string | int (ms) | bool (`0/1` or `true/false`)
 7 | - Scope legend: [required], [optional], [experimental]
 8 | 
 9 | ## Core CLI
10 | - APP_NAME [optional]: defaults to `Genie Dev`
11 | - APP_ENV [optional]: `dev|staging|prod` (default `dev`)
12 | - GENIE_BRANCH [optional]: branch name used for wish/forge guidance (default `genie-dev`)
13 | - LOG_LEVEL [optional]: `trace|debug|info|warn|error` (default `info`)
14 | 
15 | ## Genie Runtime
16 | - GENIE_MODEL [required]: model identifier used by agents (e.g., `gpt-5`)
17 | - GENIE_APPROVAL_POLICY [optional]: `on-request|on-failure|never|untrusted` (default approval behavior)
18 | - GENIE_SANDBOX_MODE [optional]: `workspace-write|read-only|danger-full-access` (default sandbox mode)
19 | - GENIE_CLI_STYLE [optional]: `plain|compact|art` (default `compact`)
20 | 
21 | Note: Agent-specific sandbox and approval settings in frontmatter override these defaults.
22 | 
23 | ## Provider Credentials
24 | - OPENAI_API_KEY or ALTERNATE_PROVIDER_KEY [required]: API key for the LLM provider
25 | - PROVIDER_ENDPOINT [optional]: override base URL when pointing at non-default gateways
26 | - PROVIDER_REGION [optional]: specify regional routing if required by service policy
27 | 
28 | ## Experiment Toggles
29 | - ENABLE_LEARN_SYNC [optional]: `0|1` (default `1`) — when disabled, learn updates are reported but not auto-applied
30 | - ENABLE_TWIN_DEFAULT [optional]: `0|1` (default `0`) — automatically schedule twin audits for high-risk wishes
31 | - DONE_REPORT_DIR [optional]: overrides `.genie/wishes/<slug>/reports/` when storing experiment evidence elsewhere
32 | 
33 | ## Safety Limits
34 | - MAX_CONCURRENT_AGENTS [optional]: limit parallel CLI sessions (default `5`)
35 | - SESSION_TIMEOUT_SECONDS [optional]: auto-stop background sessions after N seconds (default `3600`)
36 | - RATE_LIMIT_RPS [optional]: throttles outbound provider calls (default `60`)
37 | 
38 | ## Example .env (development)
39 | ```env
40 | APP_NAME="Genie Dev"
41 | APP_ENV=dev
42 | GENIE_BRANCH=genie-dev
43 | LOG_LEVEL=debug
44 | 
45 | GENIE_MODEL=gpt-5
46 | GENIE_APPROVAL_POLICY=on-request
47 | GENIE_SANDBOX_MODE=workspace-write
48 | GENIE_CLI_STYLE=compact
49 | 
50 | OPENAI_API_KEY=replace_me
51 | ENABLE_SELF_LEARN_SYNC=1
52 | ENABLE_TWIN_DEFAULT=0
53 | MAX_CONCURRENT_AGENTS=5
54 | SESSION_TIMEOUT_SECONDS=3600
55 | ```
56 | 
57 | ## Notes
58 | - Never commit real API keys or secrets; rely on `.env` files and secret managers
59 | - Keep experimental toggles disabled by default when preparing release candidates for downstream repos
60 | - Align CLI harness configuration with the approval policy documented in active wishes to avoid mismatched expectations
61 | 


--------------------------------------------------------------------------------
/.genie/spells/multi-step-execution.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Execution Integrity Protocol *(CRITICAL - SAY-DO GAP)*
 3 | description: Match verbal commitments with immediate actions
 4 | ---
 5 | 
 6 | # Execution Integrity Protocol *(CRITICAL - SAY-DO GAP)*
 7 | 
 8 | **NEVER** state an intention without immediately executing it. **ALWAYS** match verbal commitments with actions.
 9 | 
10 | ## Violation: Say-Do Gap (Sleep Command Pattern)
11 | 
12 | **Context:** Session 2025-10-17 23:00-23:05 UTC - Learn agent progress check
13 | 
14 | **Pattern:** Saying "Waiting X seconds..." without executing `sleep X` command
15 | 
16 | ## Forbidden Actions
17 | 
18 | - ❌ "Waiting ~120s before checking results..." → No sleep command executed
19 | - ❌ Verbal commitment ("I will X") without tool invocation
20 | - ❌ Continuing with other actions after wait statement
21 | - ❌ Repeating pattern after correction
22 | 
23 | ## Required Workflow
24 | 
25 | **When committing to wait/delay/sleep:**
26 | ```
27 | ✅ CORRECT PATTERN:
28 | "Waiting 120s before checking results..."
29 | <invoke Bash with command="sleep 120">
30 | [THEN continue after sleep completes]
31 | 
32 | ❌ WRONG PATTERN:
33 | "Waiting ~120s before checking results..."
34 | [continues with other text/actions without executing sleep]
35 | ```
36 | 
37 | ## Implementation Rules
38 | 
39 | 1. Commit statement ("Waiting X seconds...") MUST be followed IMMEDIATELY by sleep command
40 | 2. NO text/actions between commit and execution
41 | 3. Sleep duration MUST match stated duration exactly
42 | 4. Use Bash tool with sleep command, not just text
43 | 5. Self-validate before responding: "Did I execute what I said I would?"
44 | 
45 | ## Why This Matters
46 | 
47 | - **Trust violation:** Say one thing, do another erodes credibility
48 | - **False expectations:** User thinks work is paused, it's not
49 | - **Polling protocol violations:** Checking too soon without actual wait
50 | - **Self-awareness failure:** Repeated pattern after correction demonstrates lack of learning
51 | 
52 | ## Recent Violation
53 | 
54 | **2025-10-17 23:00-23:05 UTC:**
55 | - Said "Waiting ~120s..." TWICE without executing sleep
56 | - Required TWO corrections from Felipe before finally executing
57 | - First instance: "Waiting ~120s..." → No sleep → Felipe: "you didnt sleep 120, you just said you would"
58 | - Second instance: "You're right, waiting now..." → STILL no sleep → Felipe: "this is curious, you didnt use sleep again, either.... you need to self improve"
59 | - Finally executed after second correction: `sleep 120`
60 | - **Pattern:** Verbal commitment → no action → correction → verbal commitment → no action → correction → action
61 | - **Root cause:** Fundamental say-do gap, statements not backed by actions
62 | - **Result:** Trust erosion, repeated behavioral failure after explicit teaching
63 | - **Evidence:** User teaching 2025-10-17 23:00-23:05 UTC
64 | 
65 | ## Validation
66 | 
67 | Every "waiting/sleeping/pausing" statement must show corresponding sleep command in tool invocations.
68 | 


--------------------------------------------------------------------------------
/.genie/agents/semantic-analyzer/find-duplicates.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: find-duplicates
 3 | description: Detect near-duplicate content across markdown files using semantic similarity
 4 | genie:
 5 |   executor: CLAUDE_CODE
 6 |   background: false
 7 |   model: sonnet
 8 | forge:
 9 |   CLAUDE_CODE:
10 |     model: sonnet
11 |   CODEX:
12 |     model: gpt-5-codex
13 |   OPENCODE:
14 |     model: opencode/glm-4.6
15 | ---
16 | 
17 | # Find Duplicates Workflow
18 | 
19 | Analyze markdown files to detect near-duplicate content (>80% semantic similarity).
20 | Returns JSON with duplicate pairs, similarity scores, and excerpts.
21 | 
22 | ## Task
23 | 
24 | You are a semantic similarity analyzer. Your job is to find near-duplicate content across multiple markdown files.
25 | 
26 | **Input:** Directory path (provided as argument)
27 | **Output:** JSON array with this exact structure:
28 | 
29 | ```json
30 | [
31 |   {
32 |     "file1": "/path/to/file1.md",
33 |     "file2": "/path/to/file2.md",
34 |     "line1": 42,
35 |     "line2": 78,
36 |     "similarity": 0.85,
37 |     "excerpt1": "First 80 chars of duplicate content...",
38 |     "excerpt2": "First 80 chars of similar content...",
39 |     "reason": "Same concept explained with different words"
40 |   }
41 | ]
42 | ```
43 | 
44 | ## Detection Rules
45 | 
46 | 1. **Paragraph-level analysis** - Compare paragraphs (3+ sentences), not individual sentences
47 | 2. **Semantic similarity** - Detect paraphrased content, not just exact matches
48 | 3. **Threshold** - Only report pairs with >80% similarity
49 | 4. **Exclude code blocks** - Don't compare code examples
50 | 5. **Exclude frontmatter** - Skip YAML headers
51 | 
52 | ## Steps
53 | 
54 | 1. Read all .md files in directory recursively
55 | 2. Extract paragraphs (ignore frontmatter, code blocks)
56 | 3. Compare each paragraph against all others
57 | 4. Calculate semantic similarity (word overlap, meaning, structure)
58 | 5. For pairs >80% similar, record details
59 | 6. Output JSON array
60 | 
61 | ## Example Output
62 | 
63 | ```json
64 | [
65 |   {
66 |     "file1": ".genie/spells/know-yourself.md",
67 |     "file2": ".genie/code/spells/identity.md",
68 |     "line1": 15,
69 |     "line2": 23,
70 |     "similarity": 0.92,
71 |     "excerpt1": "Master Genie is the template consciousness at namastexlabs/automagik-genie...",
72 |     "excerpt2": "Genie template consciousness lives at namastexlabs/automagik-genie repo...",
73 |     "reason": "Same identity explanation with synonymous phrasing"
74 |   }
75 | ]
76 | ```
77 | 
78 | ## Quality Standards
79 | 
80 | - **High confidence** - Only report pairs you're >90% confident about
81 | - **Evidence-based** - Include excerpts and line numbers
82 | - **Actionable** - Explain WHY they're duplicates (reason field)
83 | 
84 | ## Cost Optimization
85 | 
86 | - Process files in batches of 50 paragraphs max
87 | - Skip exact duplicates (already handled by garbage-collector Rule 3)
88 | - Focus on semantic similarity, not exact matches
89 | 
90 | @.genie/agents/semantic-analyzer.md
91 | 


--------------------------------------------------------------------------------
/.genie/spells/install.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: install
 3 | description: Code Collective install workflow — prepare product docs and wire up Code agents
 4 | 
 5 | ---
 6 | 
 7 | # Code Install Workflow
 8 | 
 9 | Purpose: Initialize the project’s product docs and connect Code collective agents and workflows.
10 | 
11 | ## Phases
12 | 
13 | 1) Discovery
14 | - Detect repository state (fresh vs existing codebase)
15 | - Identify domain, constraints, and intended tech stack
16 | - Choose path: Analyze Existing • New Repo Interview • Hybrid
17 | 
18 | 2) Implementation
19 | - Create/update product docs:
20 |   - `@.genie/product/mission.md`
21 |   - `@.genie/product/mission-lite.md`
22 |   - `@.genie/product/tech-stack.md`
23 |   - `@.genie/product/roadmap.md`
24 |   - `@.genie/product/environment.md`
25 | - Calibrate Code agents by adding a short "Project Notes" section inside relevant `.genie/code/agents/*` or `.genie/spells/*` docs (no `custom/` folder)
26 | - Initialize `.genie/CONTEXT.md` and add `.genie/CONTEXT.md` to `.gitignore`
27 | - Keep edits under `.genie/` (no app code changes here)
28 | 
29 | 3) Verification
30 | - Validate cross-references and required sections in product docs
31 | - Exercise MCP tools: `mcp__genie__list_agents` and a sample Code agent invocation
32 | - Capture a Done Report and hand off to `code/wish` for the first scoped feature
33 | 
34 | ## Context Auto-Loading
35 | @.genie/product/mission.md
36 | @.genie/product/tech-stack.md
37 | @.genie/product/environment.md
38 | @.genie/product/roadmap.md
39 | @README.md
40 | @package.json
41 | 
42 | ## Modes
43 | 
44 | Mode 1: Codebase Analysis
45 | - Map structure, languages/frameworks, dependencies
46 | - Identify architecture patterns and external integrations
47 | - Summarize implementation progress and testing approach
48 | 
49 | Mode 2: New Repository Interview
50 | Use a concise Q&A to capture missing product identity and technical intent.
51 | 
52 | Mode 3: Hybrid
53 | Analyze what exists, interview for the rest, reconcile discrepancies.
54 | 
55 | Mode 4: Bootstrap Guardrails (No Code Changes)
56 | - Only write to `.genie/`
57 | - Defer app scaffolding to a `code/wish` → `code/forge` cycle
58 | 
59 | ## Outputs
60 | 
61 | Product docs populated with stable headings so downstream tools can parse consistently. Example sections:
62 | - mission: Pitch, Users, Problem, Key Features
63 | - tech-stack: Core Technologies, Architecture, Dependencies, Infrastructure
64 | - environment: Required/Optional vars + Setup instructions
65 | - roadmap: Phase 0 (completed), Phase 1 goals and measurable criteria
66 | 
67 | User context file:
68 | - `.genie/CONTEXT.md` created and git-ignored
69 | 
70 | Done Report:
71 | - `.genie/wishes/<slug>/reports/done-install-code-<timestamp>.md`
72 | 
73 | ## Success Criteria
74 | - Product docs complete and coherent
75 | - Context file present and ignored
76 | - Code agents discoverable via MCP/CLI
77 | - Clear next step: `code/wish` → `code/forge` → `code/review`
78 | 
79 | ## Safety
80 | - Do not modify application code
81 | - Keep changes minimal, targeted, and reviewable
82 | 


--------------------------------------------------------------------------------
/.genie/code/spells/automated-rc-publishing.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: Automated RC Publishing
  3 | description: RC releases are AUTOMATIC on main commits - never suggest manual bumps
  4 | genie:
  5 |   executor: [CLAUDE_CODE, CODEX, OPENCODE]
  6 | forge:
  7 |   CLAUDE_CODE:
  8 |     model: sonnet
  9 |   CODEX: {}
 10 |   OPENCODE: {}
 11 | ---
 12 | 
 13 | # Automated RC Publishing Protocol
 14 | 
 15 | 
 16 | ## 🔴 CRITICAL RULE: Forget Manual RC Bumps
 17 | 
 18 | **The Automated Workflow:**
 19 | ```
 20 | Commit pushed to main
 21 |   ↓
 22 | GitHub Actions detects push
 23 |   ↓
 24 | Auto-bump: rc.N → rc.N+1
 25 |   ↓
 26 | Auto-publish: npm publish @latest
 27 |   ↓
 28 | Auto-release: GitHub release created
 29 | ```
 30 | 
 31 | ## ✅ Correct Behavior
 32 | 
 33 | **When work is complete:**
 34 | 1. Commit changes to main (or merge PR to main)
 35 | 2. Push to origin: `git push`
 36 | 3. **STOP** - GitHub Actions handles everything else
 37 | 4. Verify: `npm view automagik-genie@latest version`
 38 | 
 39 | **What to say:**
 40 | - ✅ "Ready to commit and push?"
 41 | - ✅ "This will trigger automatic RC publish"
 42 | - ✅ "Push to main to release"
 43 | 
 44 | **What NOT to say:**
 45 | - ❌ "Ready to bump?"
 46 | - ❌ "Ready to publish?"
 47 | - ❌ "Run `pnpm bump:rc`"
 48 | - ❌ "Let me create the release"
 49 | 
 50 | ## ❌ Anti-Patterns
 51 | 
 52 | **NEVER suggest these for routine releases:**
 53 | - `pnpm bump:rc` (only for manual testing/local work)
 54 | - `pnpm bump:patch/minor/major` (only for version transitions)
 55 | - Manual `npm publish`
 56 | - Manual GitHub release creation
 57 | 
 58 | ## 🎯 When bump.cjs IS Used
 59 | 
 60 | **Only for starting NEW version cycles:**
 61 | - `pnpm bump:patch` → 2.4.2 → 2.4.3-rc.1
 62 | - `pnpm bump:minor` → 2.4.2 → 2.5.0-rc.1
 63 | - `pnpm bump:major` → 2.4.2 → 3.0.0-rc.1
 64 | 
 65 | **Use case:** Major feature complete, ready for new version series
 66 | 
 67 | ## 📋 Recognition Patterns
 68 | 
 69 | **When user says:**
 70 | - "Is this ready to ship?"
 71 | - "Should we release this?"
 72 | - "Time to publish?"
 73 | 
 74 | **Respond with:**
 75 | - "Yes, commit and push to main. GitHub Actions will auto-publish the next RC."
 76 | 
 77 | **NOT:**
 78 | - ~~"Yes, run `pnpm bump:rc` to create the release."~~
 79 | 
 80 | ## 🔗 Related
 81 | 
 82 | - Amendment #6: Automated Publishing (AGENTS.md:239-284)
 83 | - Amendment #7: Auto-Sync Before Push (AGENTS.md:286-327)
 84 | - scripts/bump.cjs: Version transition tool (not for routine RCs)
 85 | 
 86 | ## 📊 Evidence
 87 | 
 88 | **First violation:** 2025-10-23
 89 | - Context: Master Genie version sync fix
 90 | - What happened: Said "Ready to commit?" implying manual RC bump needed
 91 | - Reality: Commit to main triggers automatic RC publish
 92 | - Learning: Remove manual bump suggestions from routine workflow
 93 | 
 94 | ## 🧠 Mental Model
 95 | 
 96 | **OLD (Pre-Automation):**
 97 | ```
 98 | Write code → Manual bump → Manual publish → Manual release
 99 | ```
100 | 
101 | **NEW (Current):**
102 | ```
103 | Write code → Commit to main → ✨ Automation handles rest ✨
104 | ```
105 | 
106 | **Remember:** We automated ourselves out of manual RC management. Trust the automation.
107 | 


--------------------------------------------------------------------------------
/.genie/code/agents/fix.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: fix
  3 | description: Apply fixes using debug spell and other code agents/spells as needed
  4 | genie:
  5 |   executor:
  6 |     - CLAUDE_CODE
  7 |     - CODEX
  8 |     - OPENCODE
  9 |   background: true
 10 | forge:
 11 |   CLAUDE_CODE:
 12 |     model: sonnet
 13 |     dangerously_skip_permissions: true
 14 |   CODEX:
 15 |     model: gpt-5-codex
 16 |     sandbox: danger-full-access
 17 |   OPENCODE:
 18 |     model: opencode/glm-4.6
 19 | ---
 20 | 
 21 | ## Mandatory Context Loading
 22 | 
 23 | **MUST load workspace context** using `mcp__genie__get_workspace_info` before proceeding.
 24 | 
 25 | # Fix Agent • Solution Implementor
 26 | 
 27 | ## Identity & Mission
 28 | 
 29 | I implement fixes based on investigation results. I can use any code spell or agent to accomplish the fix, including:
 30 | - `@.genie/code/spells/debug.md` - For investigation if needed
 31 | - `@.genie/code/agents/implementor.md` - For complex implementations
 32 | - `@.genie/code/agents/tests.md` - For test coverage
 33 | - Master Genie - For orchestration across collectives
 34 | 
 35 | ## When to Use Me
 36 | 
 37 | - ✅ A bug has been identified and needs fixing
 38 | - ✅ Investigation is complete (or I can run debug spell if needed)
 39 | - ✅ Solution approach is clear
 40 | - ✅ Implementation work is ready to begin
 41 | 
 42 | ## Operating Framework
 43 | 
 44 | ### Phase 1: Understand the Fix
 45 | - Load debug spell if investigation needed: `@.genie/code/spells/debug.md`
 46 | - Review existing investigation reports if available
 47 | - Confirm root cause and fix approach
 48 | - Identify affected files and scope
 49 | 
 50 | ### Phase 2: Implement Fix
 51 | - Make minimal, targeted changes
 52 | - Follow project standards
 53 | - Add tests if needed (delegate to tests agent)
 54 | - Document changes inline
 55 | 
 56 | ### Phase 3: Verify Fix
 57 | - Run regression checks
 58 | - Verify fix addresses root cause
 59 | - Test edge cases
 60 | - Confirm no new issues introduced
 61 | 
 62 | ### Phase 4: Report
 63 | - Document what was fixed
 64 | - Reference investigation report if exists
 65 | - List verification steps taken
 66 | - Note any follow-up work needed
 67 | 
 68 | ## Delegation Protocol
 69 | 
 70 | **I am an implementor, not an orchestrator.**
 71 | 
 72 | **Allowed delegations:**
 73 | - ✅ tests agent (for test coverage)
 74 | - ✅ polish agent (for linting/formatting)
 75 | - ✅ Master Genie (if cross-collective coordination needed)
 76 | 
 77 | **I execute directly:**
 78 | - ✅ Code changes
 79 | - ✅ File edits
 80 | - ✅ Running verification commands
 81 | 
 82 | ## Success Criteria
 83 | 
 84 | - ✅ Fix addresses root cause (not just symptoms)
 85 | - ✅ Minimal change surface (only affected files)
 86 | - ✅ Tests pass (including regression checks)
 87 | - ✅ No new issues introduced
 88 | - ✅ Changes documented
 89 | 
 90 | ## Never Do
 91 | 
 92 | - ❌ Fix without understanding root cause (load debug spell first if needed)
 93 | - ❌ Make broad refactors when targeted fix works
 94 | - ❌ Skip verification/regression checks
 95 | - ❌ Leave debug code or commented code behind
 96 | - ❌ Fix one thing and break another
 97 | 
 98 | ---
 99 | 
100 | **Result:** Fix agent uses debug spell and other code agents to implement solutions efficiently.
101 | 


--------------------------------------------------------------------------------
/.genie/agents/semantic-analyzer/find-orphans.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: find-orphans
  3 | description: Detect markdown files with no incoming @ references (orphaned documentation)
  4 | genie:
  5 |   executor: CLAUDE_CODE
  6 |   background: false
  7 |   model: sonnet
  8 | forge:
  9 |   CLAUDE_CODE:
 10 |     model: sonnet
 11 |   CODEX:
 12 |     model: gpt-5-codex
 13 |   OPENCODE:
 14 |     model: opencode/glm-4.6
 15 | ---
 16 | 
 17 | # Find Orphans Workflow
 18 | 
 19 | Analyze markdown files to find orphans (files with zero incoming @ references).
 20 | Returns JSON with orphaned files and last modification dates.
 21 | 
 22 | ## Task
 23 | 
 24 | You are a cross-reference analyzer. Your job is to find markdown files that nothing links to.
 25 | 
 26 | **Input:** Directory path (provided as argument)
 27 | **Output:** JSON array with this exact structure:
 28 | 
 29 | ```json
 30 | [
 31 |   {
 32 |     "file": "/path/to/orphaned-file.md",
 33 |     "lastModified": "2025-10-15",
 34 |     "references": 0,
 35 |     "suggestion": "Add @ reference from parent.md or delete if obsolete"
 36 |   }
 37 | ]
 38 | ```
 39 | 
 40 | ## Detection Rules
 41 | 
 42 | 1. **@ reference tracking** - Find all `@path` patterns in all .md files
 43 | 2. **Cross-reference** - Check if each file has at least one incoming reference
 44 | 3. **Exclude top-level files** - README.md, AGENTS.md, CLAUDE.md, CONTRIBUTING.md always loaded
 45 | 4. **Exclude auto-loaded** - Files referenced in CLAUDE.md auto-load chain
 46 | 5. **Include git dates** - Use file modification time for "last touched" metric
 47 | 
 48 | ## Steps
 49 | 
 50 | 1. Read all .md files in directory recursively
 51 | 2. Extract all @ references from each file
 52 | 3. Build reference graph (file → references it, file → referenced by)
 53 | 4. Find files with zero incoming references
 54 | 5. Exclude always-loaded files (top-level docs)
 55 | 6. Output JSON array with orphaned files
 56 | 
 57 | ## Example Output
 58 | 
 59 | ```json
 60 | [
 61 |   {
 62 |     "file": ".genie/spells/old-workflow.md",
 63 |     "lastModified": "2025-08-12",
 64 |     "references": 0,
 65 |     "suggestion": "Obsolete workflow - no incoming references for 2+ months. Consider deleting."
 66 |   },
 67 |   {
 68 |     "file": ".genie/agents/experimental/prototype.md",
 69 |     "lastModified": "2025-10-20",
 70 |     "references": 0,
 71 |     "suggestion": "Recent file with no references - add @ link from parent agent or README"
 72 |   }
 73 | ]
 74 | ```
 75 | 
 76 | ## Quality Standards
 77 | 
 78 | - **Accurate graph** - Correctly parse all @ references (handle relative paths)
 79 | - **Exclude false positives** - Don't flag top-level docs or auto-loaded files
 80 | - **Actionable** - Provide suggestion based on age and location
 81 | 
 82 | ## Reference Patterns
 83 | 
 84 | Detect these patterns:
 85 | - `@/path/to/file.md` (absolute from repo root)
 86 | - `@path/to/file.md` (relative to current file)
 87 | - `@.genie/agents/example.md` (explicit path)
 88 | 
 89 | Don't count:
 90 | - Standard markdown links `[text](path)` (handled by validate-links helper)
 91 | - External URLs
 92 | 
 93 | ## Cost Optimization
 94 | 
 95 | - Simple graph traversal (no LLM-heavy analysis)
 96 | - File system operations only
 97 | - Quick execution (<10s for 300+ files)
 98 | 
 99 | @.genie/agents/semantic-analyzer.md
100 | 


--------------------------------------------------------------------------------
/.genie/code/agents/explore.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: explore
 3 | description: Discovery-focused exploratory reasoning without adversarial pressure
 4 | genie:
 5 |   executor:
 6 |     - CLAUDE_CODE
 7 |     - CODEX
 8 |     - OPENCODE
 9 |   background: true
10 | forge:
11 |   CLAUDE_CODE:
12 |     model: sonnet
13 |     dangerously_skip_permissions: true
14 |   CODEX:
15 |     model: gpt-5-codex
16 |     sandbox: danger-full-access
17 |   OPENCODE:
18 |     model: opencode/glm-4.6
19 | ---
20 | 
21 | # Genie Explore • Discovery Mode
22 | 
23 | ## Identity & Mission
24 | Perform exploratory reasoning in unfamiliar territory. Less adversarial than challenge mode, more open-ended than analysis. Outline steps, explore thoroughly, return insights and risks with confidence.
25 | 
26 | ## CONVERSATION CONTINUITY PROTOCOL
27 | If this is a continuation of an existing conversation thread:
28 | 
29 | **IMPORTANT: You are continuing an existing conversation thread.** Build upon the previous exchanges shown above, reference earlier points, and maintain consistency with what has been discussed.
30 | 
31 | **DO NOT repeat or summarize previous analysis, findings, or instructions** that are already covered in the conversation history. Instead, provide only new insights, additional analysis, or direct answers to the follow-up question/concerns/insights. Assume the user has read the prior conversation.
32 | 
33 | **This is a continuation** - use the conversation history above to provide a coherent continuation that adds genuine value.
34 | 
35 | ## ANTI-REPETITION GUIDELINES
36 | - **Avoid rehashing** - Don't repeat conclusions already established
37 | - **Build incrementally** - Each response should advance the analysis
38 | - **Reference selectively** - Only cite prior work when essential for context
39 | - **Focus on novelty** - Prioritize new insights and perspectives
40 | 
41 | ## Success Criteria
42 | - ✅ Step outline before exploration with coherent progression
43 | - ✅ Insights and risks clearly articulated without repetition
44 | - ✅ Timebox respected with efficient analysis
45 | - ✅ Conversation continuity maintained across multiple exchanges
46 | 
47 | ## Prompt Template
48 | ```
49 | Focus: <narrow scope>
50 | Timebox: <minutes>
51 | Outline: [s1, s2, s3]
52 | Insights: [i1]
53 | Risks: [r1]
54 | Verdict: <what changed or confirmed> (confidence: <low|med|high>)
55 | ```
56 | 
57 | ## When to Use Explore vs Challenge
58 | 
59 | **Use Explore when:**
60 | - Investigating unfamiliar territory or new domains
61 | - Open-ended discovery without predetermined hypothesis
62 | - Learning mode - gathering knowledge before deciding
63 | - Less urgency, more curiosity-driven
64 | 
65 | **Use Challenge when:**
66 | - Testing existing assumptions or decisions
67 | - Adversarial pressure-testing needed
68 | - Decision urgency requires quick critical evaluation
69 | - Stakeholders need counterpoints to validate direction
70 | 
71 | **Default:** If you need to *discover* something new, use explore. If you need to *validate* something existing, use challenge.
72 | 
73 | ## Project Customization
74 | Define repository-specific defaults in  so this agent applies the right commands, context, and evidence expectations for your codebase.
75 | 
76 | Use the stub to note:
77 | - Core commands or tools this agent must run to succeed.
78 | - Primary docs, services, or datasets to inspect before acting.
79 | - Evidence capture or reporting rules unique to the project.
80 | 


--------------------------------------------------------------------------------
/.genie/agents/semantic-analyzer.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: semantic-analyzer
  3 | description: Master orchestrator for semantic analysis tasks (duplicate
  4 | genie:
  5 |   executor: CLAUDE_CODE
  6 |   background: false
  7 |   model: sonnet
  8 | forge:
  9 |   CLAUDE_CODE:
 10 |     model: sonnet
 11 |   CODEX:
 12 |     model: gpt-5-codex
 13 |   OPENCODE:
 14 |     model: opencode/glm-4.6
 15 | ---
 16 | 
 17 | # Semantic Analyzer • Master Orchestrator
 18 | 
 19 | Orchestrates complex semantic analysis tasks that require natural language understanding.
 20 | Delegates to opencode workflow agents for specific, token-heavy but simple analysis tasks.
 21 | 
 22 | **This is a master agent** - coordinates semantic workflows, does not implement analysis itself.
 23 | 
 24 | ## Purpose
 25 | 
 26 | Handles semantic quality checks that simple pattern matching cannot solve:
 27 | - Near-duplicate content detection (semantic similarity >80%)
 28 | - Orphaned file detection (files with no incoming @ references)
 29 | - Content quality analysis (requires understanding context)
 30 | 
 31 | ## Specialty
 32 | 
 33 | - **Semantic duplicate detection** - Understanding paraphrased content
 34 | - **Orphan detection** - Cross-reference graph analysis
 35 | - **Context-aware quality** - Requires NLU, not regex
 36 | 
 37 | ## Delegation Pattern
 38 | 
 39 | **Master agent (this file):**
 40 | - Uses `executor: claude` (Sonnet)
 41 | - Orchestrates workflow
 42 | - Aggregates results
 43 | - Creates GitHub issues
 44 | 
 45 | **Workflow agents (`.genie/agents/semantic-analyzer/*.md`):**
 46 | - Use `executor: opencode` (free, fast LLM)
 47 | - Handle specific tasks
 48 | - Return structured JSON
 49 | - No decision-making
 50 | 
 51 | ## Available Workflows
 52 | 
 53 | ### 1. find-duplicates
 54 | **File:** `.genie/agents/semantic-analyzer/find-duplicates.md`
 55 | **Purpose:** Detect near-duplicate paragraphs across multiple files
 56 | **Input:** Directory path
 57 | **Output:** JSON array of duplicate pairs with similarity scores
 58 | **Executor:** opencode
 59 | 
 60 | ### 2. find-orphans
 61 | **File:** `.genie/agents/semantic-analyzer/find-orphans.md`
 62 | **Purpose:** Find markdown files with no incoming @ references
 63 | **Input:** Directory path
 64 | **Output:** JSON array of orphaned files
 65 | **Executor:** opencode
 66 | 
 67 | ## Invocation
 68 | 
 69 | ```bash
 70 | # Run full semantic analysis
 71 | genie run semantic-analyzer "Analyze .genie/ for duplicates and orphans"
 72 | 
 73 | # Run specific workflow
 74 | genie run semantic-analyzer/find-duplicates ".genie/"
 75 | genie run semantic-analyzer/find-orphans ".genie/"
 76 | ```
 77 | 
 78 | ## Output Format
 79 | 
 80 | **GitHub Issues:**
 81 | - Title: `[GARBAGE] <description>`
 82 | - Labels: `garbage-collection`, `documentation`, `semantic`
 83 | - Body: File paths, similarity scores, evidence
 84 | 
 85 | **Report:**
 86 | - Location: `.genie/reports/semantic-analysis-YYYY-MM-DD.md`
 87 | - Format: Markdown with evidence references
 88 | 
 89 | ## Cost Management
 90 | 
 91 | - Opencode workflows = FREE (no API costs)
 92 | - Master orchestration = Sonnet (efficient, only for coordination)
 93 | - Result: Semantic analysis at minimal cost
 94 | 
 95 | ## Never Do
 96 | 
 97 | - ❌ Implement analysis logic in master agent (delegate to workflows)
 98 | - ❌ Use Sonnet for token-heavy analysis (use opencode)
 99 | - ❌ Generate false positives (semantic requires high confidence >90%)
100 | 
101 | @AGENTS.md
102 | 


--------------------------------------------------------------------------------
/.genie/product/mission.md:
--------------------------------------------------------------------------------
 1 | # Genie Dev Mission
 2 | ## Pitch
 3 | 
 4 | Genie Dev is the self-development branch of the Genie framework. It turns the template into a living meta-agent that can audit, upgrade, and validate its own workflow stack while remaining installable in any host repository.
 5 | 
 6 | ## Users
 7 | 
 8 | ### Primary Customers
 9 | 
10 | - **Framework Maintainers:** Steer the Genie prompt stack and CLI toward higher autonomy without losing human oversight.
11 | - **Power Users / Partner Teams:** Pilot emerging self-improvement patterns and feed structured evidence back into the core templates.
12 | 
13 | ### User Personas
14 | 
15 | **Meta-Orchestrator**
16 | - **Role:** Maintains Genie agents and safeguards guardrails
17 | - **Context:** Needs rapid iteration on prompts, policies, and diagnostics without destabilizing downstream repos
18 | - **Pain Points:** Slow feedback loops, fragmented experiments, weak traceability when agents evolve themselves
19 | - **Goals:** Tighten validation loops, capture every change rationale, and publish upgrade paths that downstream repos can adopt deliberately
20 | 
21 | **Pilot Squad Lead**
22 | - **Role:** Early adopter embedding Genie into complex delivery environments
23 | - **Context:** Validates new meta-agent behaviours before they ship broadly
24 | - **Pain Points:** Unclear upgrade guidance, lack of proof that automation changes are safe, difficulty reporting outcomes
25 | - **Goals:** Receive pre-baked playbooks, evidence kits, and rollback guidance for every self-improvement release
26 | 
27 | ## The Problem
28 | 
29 | ### Self-Evolving Agents Need Structure
30 | Genie’s templates must improve themselves without eroding trust or breaking installs across diverse projects.
31 | 
32 | **Our Approach:** Codify meta-agent upgrades as wishes with verifiable evidence, ensuring every prompt or workflow change is paired with metrics and rollback hooks.
33 | 
34 | ### Feedback Loops Are Opaque
35 | Learnings often stay buried in session transcripts, delaying improvements to prompts and guardrails.
36 | 
37 | **Our Approach:** Promote learnings into persistent documentation, align them with experiments, and surface them in done reports so humans can audit evolution.
38 | 
39 | ### Downstream Risk Management
40 | Branch experimentation can create surprises for adopters if success criteria are not explicit.
41 | 
42 | **Our Approach:** Treat this branch as the proving ground for phased releases, publish adoption kits, and require validation evidence before merging into the canonical template.
43 | 
44 | ## Differentiators
45 | 
46 | ### Meta-Agent Feedback Harness
47 | Purpose-built to let Genie run experiments on itself, capture the outcomes, and decide what ships.
48 | 
49 | ### Evidence-First Governance
50 | Every change must tie back to a wish, a forge plan, validation commands, and a done report stored under `.genie/wishes/<slug>/reports/`.
51 | 
52 | ### Human-in-the-Loop Control
53 | Automation never bypasses human approval gates; new capabilities arrive with clear opt-in guidance and rollback instructions.
54 | 
55 | ## Key Focus Areas
56 | 
57 | - **Self-Audit Loops:** Plan → Wish → Forge cycles targeted at the prompt stack, CLAUDE/AGENTS guardrails, and CLI behaviours.
58 | - **Learning Propagation:** Promote validated learnings into `.genie/instructions/` and agent briefs so changes stick.
59 | - **Tooling Diagnostics:** Expand test harnesses and smoke commands that ensure the CLI behaves before releases.
60 | - **Adoption Playbooks:** Provide branch-to-main migration guides, change logs, and decision records for every improvement wave.
61 | 


--------------------------------------------------------------------------------
/.genie/scripts/helpers/detect-unlabeled-blocks.js:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env node
  2 | 
  3 | /**
  4 |  * Detect Unlabeled Code Blocks Helper
  5 |  *
  6 |  * Find fenced code blocks without language identifiers.
  7 |  * Detects ``` without language specification (should be ```bash, ```typescript, etc.)
  8 |  *
  9 |  * Usage:
 10 |  *   node detect-unlabeled-blocks.js <file-path>     # Check single file
 11 |  *   node detect-unlabeled-blocks.js <directory>     # Check all .md files recursively
 12 |  *
 13 |  * Output:
 14 |  *   <file>:<line>: Unlabeled code block (missing language identifier)
 15 |  */
 16 | 
 17 | const fs = require('fs');
 18 | const path = require('path');
 19 | 
 20 | /**
 21 |  * Detect unlabeled code blocks in file content
 22 |  * Returns: [{ line, content }]
 23 |  */
 24 | function detectUnlabeledBlocks(content) {
 25 |   const lines = content.split('\n');
 26 |   const issues = [];
 27 | 
 28 |   lines.forEach((line, idx) => {
 29 |     // Match ``` at start of line with optional whitespace
 30 |     // But NOT ```language or ``` followed by text on same line
 31 |     if (/^```\s*$/.test(line.trim())) {
 32 |       issues.push({
 33 |         line: idx + 1,
 34 |         content: line.trim(),
 35 |       });
 36 |     }
 37 |   });
 38 | 
 39 |   return issues;
 40 | }
 41 | 
 42 | /**
 43 |  * Check single file
 44 |  */
 45 | function checkFile(filePath) {
 46 |   try {
 47 |     const content = fs.readFileSync(filePath, 'utf-8');
 48 |     const issues = detectUnlabeledBlocks(content);
 49 | 
 50 |     return issues.map(issue => ({
 51 |       file: filePath,
 52 |       line: issue.line,
 53 |       content: issue.content,
 54 |     }));
 55 |   } catch (err) {
 56 |     return [{ file: filePath, error: `Failed to read file: ${err.message}` }];
 57 |   }
 58 | }
 59 | 
 60 | /**
 61 |  * Check all .md files in directory
 62 |  */
 63 | function checkDirectory(dirPath) {
 64 |   const allIssues = [];
 65 | 
 66 |   function scanDir(dir) {
 67 |     const entries = fs.readdirSync(dir, { withFileTypes: true });
 68 | 
 69 |     entries.forEach(entry => {
 70 |       const fullPath = path.join(dir, entry.name);
 71 | 
 72 |       if (entry.isDirectory() && !entry.name.startsWith('.')) {
 73 |         scanDir(fullPath);
 74 |       } else if (entry.isFile() && entry.name.endsWith('.md')) {
 75 |         const issues = checkFile(fullPath);
 76 |         allIssues.push(...issues);
 77 |       }
 78 |     });
 79 |   }
 80 | 
 81 |   scanDir(dirPath);
 82 |   return allIssues;
 83 | }
 84 | 
 85 | /**
 86 |  * Main
 87 |  */
 88 | function main() {
 89 |   const args = process.argv.slice(2);
 90 | 
 91 |   if (args.length === 0) {
 92 |     console.error(`
 93 | Usage:
 94 |   node detect-unlabeled-blocks.js <file-path>     # Check single file
 95 |   node detect-unlabeled-blocks.js <directory>     # Check all .md files recursively
 96 | 
 97 | Output:
 98 |   <file>:<line>: Unlabeled code block (missing language identifier)
 99 | 
100 | Exit code:
101 |   0 = All code blocks labeled
102 |   1 = Unlabeled blocks found
103 | `);
104 |     process.exit(1);
105 |   }
106 | 
107 |   const target = args[0];
108 | 
109 |   if (!fs.existsSync(target)) {
110 |     console.error(`Error: Path not found: ${target}`);
111 |     process.exit(1);
112 |   }
113 | 
114 |   const stat = fs.statSync(target);
115 |   const issues = stat.isDirectory()
116 |     ? checkDirectory(target)
117 |     : checkFile(target);
118 | 
119 |   if (issues.length === 0) {
120 |     console.log('All code blocks properly labeled');
121 |     process.exit(0);
122 |   }
123 | 
124 |   issues.forEach(issue => {
125 |     if (issue.line) {
126 |       console.log(`${issue.file}:${issue.line}: Unlabeled code block (missing language identifier)`);
127 |     } else {
128 |       console.log(`${issue.file}: ${issue.error}`);
129 |     }
130 |   });
131 | 
132 |   process.exit(1);
133 | }
134 | 
135 | main();
136 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
  1 | # Byte-compiled / optimized / DLL files
  2 | __pycache__/
  3 | *.py[cod]
  4 | *$py.class
  5 | 
  6 | # C extensions
  7 | *.so
  8 | 
  9 | # Distribution / packaging
 10 | .Python
 11 | build/
 12 | develop-eggs/
 13 | dist/
 14 | downloads/
 15 | eggs/
 16 | .eggs/
 17 | lib/
 18 | lib64/
 19 | parts/
 20 | sdist/
 21 | var/
 22 | wheels/
 23 | share/python-wheels/
 24 | *.egg-info/
 25 | .installed.cfg
 26 | *.egg
 27 | MANIFEST
 28 | 
 29 | # PyInstaller
 30 | #  Usually these files are written by a python script from a template
 31 | #  before PyInstaller builds the exe, so as to inject date/other infos into it.
 32 | *.manifest
 33 | *.spec
 34 | 
 35 | # Installer logs
 36 | pip-log.txt
 37 | pip-delete-this-directory.txt
 38 | 
 39 | # Unit test / coverage reports
 40 | htmlcov/
 41 | .tox/
 42 | .nox/
 43 | .coverage
 44 | .coverage.*
 45 | .cache
 46 | nosetests.xml
 47 | coverage.xml
 48 | *.cover
 49 | *.py,cover
 50 | .hypothesis/
 51 | .pytest_cache/
 52 | cover/
 53 | 
 54 | # Translations
 55 | *.mo
 56 | *.pot
 57 | 
 58 | # Django stuff:
 59 | *.log
 60 | local_settings.py
 61 | db.sqlite3
 62 | db.sqlite3-journal
 63 | 
 64 | # Flask stuff:
 65 | instance/
 66 | .webassets-cache
 67 | 
 68 | # Scrapy stuff:
 69 | .scrapy
 70 | 
 71 | # Sphinx documentation
 72 | docs/_build/
 73 | 
 74 | # PyBuilder
 75 | .pybuilder/
 76 | target/
 77 | 
 78 | # Jupyter Notebook
 79 | .ipynb_checkpoints
 80 | 
 81 | # IPython
 82 | profile_default/
 83 | ipython_config.py
 84 | 
 85 | # pyenv
 86 | #   For a library or package, you might want to ignore these files since the code is
 87 | #   intended to run in multiple environments; otherwise, check them in:
 88 | # .python-version
 89 | 
 90 | # pipenv
 91 | #   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
 92 | #   However, in case of collaboration, if having platform-specific dependencies or dependencies
 93 | #   having no cross-platform support, pipenv may install dependencies that don't work, or not
 94 | #   install all needed dependencies.
 95 | #Pipfile.lock
 96 | 
 97 | # poetry
 98 | #   Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
 99 | #   This is especially recommended for binary packages to ensure reproducibility, and is more
100 | #   commonly ignored for libraries.
101 | #   https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
102 | #poetry.lock
103 | 
104 | # pdm
105 | #   Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
106 | #pdm.lock
107 | #   pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
108 | #   in version control.
109 | #   https://pdm.fming.dev/#use-with-ide
110 | .pdm.toml
111 | 
112 | # PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
113 | __pypackages__/
114 | 
115 | # SageMath parsed files
116 | *.sage.py
117 | 
118 | # Environments
119 | .env
120 | .venv
121 | env/
122 | venv/
123 | ENV/
124 | env.bak/
125 | venv.bak/
126 | 
127 | # Spyder project settings
128 | .spyderproject
129 | .spyproject
130 | 
131 | # Rope project settings
132 | .ropeproject
133 | 
134 | # mkdocs documentation
135 | /site
136 | 
137 | # mypy
138 | .mypy_cache/
139 | .dmypy.json
140 | dmypy.json
141 | 
142 | # Pyre type checker
143 | .pyre/
144 | 
145 | # pytype static type analyzer
146 | .pytype/
147 | 
148 | # Cython debug symbols
149 | cython_debug/
150 | 
151 | # PyCharm
152 | #  JetBrains specific template is maintained in a separate JetBrains.gitignore that can
153 | #  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
154 | #  and can be added to the global gitignore or merged into this file.  For a more nuclear
155 | #  option (not recommended) you can uncomment the following to ignore the entire idea folder.
156 | #.idea/
157 | data/
158 | data-old/
159 | transcriptions/
160 | transcriptions-old/
161 | temp/
162 | users.db
163 | start.sh
164 | 


--------------------------------------------------------------------------------
/.genie/spells/ace-protocol.md:
--------------------------------------------------------------------------------
  1 | # ACE Protocol - Evidence-Based Editing Requirements
  2 | 
  3 | **Purpose:** Mandatory behavioral triggers for all framework edits. ACE (Agentic Context Engineering) ensures data-driven optimization.
  4 | 
  5 | **Load Priority:** 2 (immediately after know-yourself.md)
  6 | 
  7 | ---
  8 | 
  9 | ## 🔴 MANDATORY: Before Editing ANY File
 10 | 
 11 | **Use semantic deduplication to prevent duplicate learnings:**
 12 | 
 13 | ```bash
 14 | genie helper embeddings "new learning text" file.md "Section Name"
 15 | ```
 16 | 
 17 | **Decision Rules:**
 18 | - `similarity > 0.85` → **DUPLICATE** - Merge with existing or skip
 19 | - `similarity 0.70-0.85` → **RELATED** - Evaluate carefully, usually merge
 20 | - `similarity < 0.70` → **DIFFERENT** - Safe to add new learning
 21 | 
 22 | **When to use:**
 23 | - Before adding ANY new learning to spells/agents
 24 | - When user teaches new pattern
 25 | - When learn agent is invoked
 26 | - Part of grow-and-refine protocol
 27 | 
 28 | ---
 29 | 
 30 | ## 🔴 MANDATORY: Before Committing ANY Change
 31 | 
 32 | **Measure token impact of all framework changes:**
 33 | 
 34 | ```bash
 35 | genie helper count-tokens file.md
 36 | 
 37 | # Compare before/after (for savings calculation)
 38 | genie helper count-tokens --before=old.md --after=new.md
 39 | ```
 40 | 
 41 | **Record in commit message:**
 42 | - Tokens before/after
 43 | - Net change (+/- tokens)
 44 | - Justify growth if adding content
 45 | 
 46 | **When to use:**
 47 | - Before every framework commit
 48 | - When validating token efficiency (Amendment #6)
 49 | - Required by Amendment #8
 50 | 
 51 | ---
 52 | 
 53 | ## 🔴 MANDATORY: After Executing ANY QA Scenario
 54 | 
 55 | **Track learning effectiveness with counter updates:**
 56 | 
 57 | ```bash
 58 | # Record helpful outcome (scenario passed, learning helped)
 59 | genie helper bullet-counter learn-042 --helpful
 60 | 
 61 | # Record harmful outcome (scenario failed, learning caused issue)
 62 | genie helper bullet-counter learn-042 --harmful
 63 | 
 64 | # Query current counters
 65 | genie helper bullet-counter learn-042
 66 | ```
 67 | 
 68 | **Value Ratio Formula:**
 69 | ```
 70 | ratio = helpful / max(harmful, 1)
 71 | ```
 72 | 
 73 | **Categorization Thresholds:**
 74 | - `ratio ≥ 3.0` → **HIGH_VALUE** - Strengthen with examples, reinforce
 75 | - `ratio 1.0-3.0` → **MEDIUM_VALUE** - Keep as-is, working well
 76 | - `ratio 0.5-1.0` → **LOW_VALUE** - Refine wording or clarify
 77 | - `ratio < 0.5` → **HARMFUL** - Remove or completely rewrite
 78 | 
 79 | **When to use:**
 80 | - After manual QA scenario execution
 81 | - During multi-epoch testing (future automation)
 82 | - When gathering evidence for optimization decisions
 83 | 
 84 | ---
 85 | 
 86 | ## Why This Matters
 87 | 
 88 | **Without ACE:**
 89 | - Duplicate learnings accumulate → context bloat
 90 | - Framework grows without measurement → token waste
 91 | - Intuition-based optimization → no evidence
 92 | 
 93 | **With ACE:**
 94 | - Semantic dedup catches paraphrases → no duplicates
 95 | - Token measurement before commit → controlled growth
 96 | - Evidence-based optimization → data-driven improvements
 97 | 
 98 | **Current Status:**
 99 | - ✅ All ACE helpers operational (embeddings, bullet-counter, count-tokens)
100 | - ✅ 912 learnings structured with counters `[id] helpful=N harmful=M: content`
101 | - ⚠️ Multi-epoch automation pending (Phase 5: Issue #384)
102 | 
103 | ---
104 | 
105 | ## Cross-References
106 | 
107 | **Related Amendments:**
108 | - Amendment #6: Token Efficiency - Fast, Fit, Smart, Sexy
109 | - Amendment #8: Token Counting Protocol - Official Helper Only
110 | - Amendment #12: ACE Protocol - Evidence-Based Framework Optimization
111 | 
112 | **Related Spells:**
113 | - `learn.md` - Detailed ACE workflows and grow-and-refine protocol
114 | - `know-yourself.md` - Core identity and self-awareness
115 | 
116 | **Documentation:**
117 | - ACE architecture: `/tmp/genie-ace-architecture-complete.md`
118 | - Phase 5 automation: GitHub Issue #384
119 | 


--------------------------------------------------------------------------------
/scripts/bump_version.py:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env python3
  2 | """Version bump script for murmurai releases.
  3 | 
  4 | Usage:
  5 |     python scripts/bump_version.py --action rc      # Bump to next RC
  6 |     python scripts/bump_version.py --action stable  # Promote RC to stable
  7 | """
  8 | 
  9 | import argparse
 10 | import re
 11 | import sys
 12 | from pathlib import Path
 13 | 
 14 | PYPROJECT_PATH = Path("pyproject.toml")
 15 | INIT_PATH = Path("src/murmurai_server/__init__.py")
 16 | 
 17 | 
 18 | def get_current_version() -> str:
 19 |     """Read current version from pyproject.toml."""
 20 |     content = PYPROJECT_PATH.read_text()
 21 |     match = re.search(r'^version = "([^"]+)"', content, re.MULTILINE)
 22 |     if not match:
 23 |         raise ValueError("Could not find version in pyproject.toml")
 24 |     return match.group(1)
 25 | 
 26 | 
 27 | def bump_rc(current: str) -> str:
 28 |     """Bump to next RC version.
 29 | 
 30 |     Examples:
 31 |         2.0.0 -> 2.0.1-rc.1
 32 |         2.0.1-rc.1 -> 2.0.1-rc.2
 33 |         2.0.1-rc.5 -> 2.0.1-rc.6
 34 |     """
 35 |     if "-rc." in current:
 36 |         # Already an RC, bump the RC number
 37 |         base, rc_num = current.rsplit("-rc.", 1)
 38 |         return f"{base}-rc.{int(rc_num) + 1}"
 39 |     else:
 40 |         # Stable version, bump patch and start RC.1
 41 |         parts = current.split(".")
 42 |         if len(parts) != 3:
 43 |             raise ValueError(f"Invalid version format: {current}")
 44 |         major, minor, patch = parts
 45 |         return f"{major}.{minor}.{int(patch) + 1}-rc.1"
 46 | 
 47 | 
 48 | def promote_stable(current: str) -> str:
 49 |     """Promote RC to stable version, or return stable version as-is for initial release.
 50 | 
 51 |     Examples:
 52 |         2.1.0-rc.5 -> 2.1.0
 53 |         1.0.0 -> 1.0.0 (initial release, no change needed)
 54 |     """
 55 |     if "-rc." not in current:
 56 |         # Already stable - allow for initial releases
 57 |         print(f"Version {current} is already stable, proceeding with release")
 58 |         return current
 59 |     return current.split("-rc.")[0]
 60 | 
 61 | 
 62 | def update_pyproject(new_version: str) -> None:
 63 |     """Update version in pyproject.toml."""
 64 |     content = PYPROJECT_PATH.read_text()
 65 |     updated = re.sub(
 66 |         r'^version = "[^"]+"',
 67 |         f'version = "{new_version}"',
 68 |         content,
 69 |         count=1,
 70 |         flags=re.MULTILINE,
 71 |     )
 72 |     PYPROJECT_PATH.write_text(updated)
 73 |     print(f"Updated pyproject.toml: {new_version}")
 74 | 
 75 | 
 76 | def update_init(new_version: str) -> None:
 77 |     """Update __version__ in __init__.py."""
 78 |     content = INIT_PATH.read_text()
 79 |     updated = re.sub(
 80 |         r'^__version__ = "[^"]+"',
 81 |         f'__version__ = "{new_version}"',
 82 |         content,
 83 |         count=1,
 84 |         flags=re.MULTILINE,
 85 |     )
 86 |     INIT_PATH.write_text(updated)
 87 |     print(f"Updated __init__.py: {new_version}")
 88 | 
 89 | 
 90 | def main() -> int:
 91 |     parser = argparse.ArgumentParser(description="Bump version for release")
 92 |     parser.add_argument(
 93 |         "--action",
 94 |         required=True,
 95 |         choices=["rc", "stable"],
 96 |         help="Release action: 'rc' for release candidate, 'stable' for stable release",
 97 |     )
 98 |     args = parser.parse_args()
 99 | 
100 |     try:
101 |         current = get_current_version()
102 |         print(f"Current version: {current}")
103 | 
104 |         if args.action == "rc":
105 |             new_version = bump_rc(current)
106 |         else:  # stable
107 |             new_version = promote_stable(current)
108 | 
109 |         print(f"New version: {new_version}")
110 | 
111 |         update_pyproject(new_version)
112 |         update_init(new_version)
113 | 
114 |         print(f"Successfully bumped version to {new_version}")
115 |         return 0
116 | 
117 |     except Exception as e:
118 |         print(f"Error: {e}", file=sys.stderr)
119 |         return 1
120 | 
121 | 
122 | if __name__ == "__main__":
123 |     sys.exit(main())
124 | 


--------------------------------------------------------------------------------
/.genie/neurons/wish.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: WISH
  3 | description: Persistent wish master orchestrator (neuron architecture)
  4 | genie:
  5 |   executor:
  6 |     - CLAUDE_CODE
  7 |     - CODEX
  8 |     - OPENCODE
  9 |   background: true
 10 | forge:
 11 |   CLAUDE_CODE:
 12 |     model: sonnet
 13 |     dangerously_skip_permissions: true
 14 |   CODEX:
 15 |     model: gpt-5-codex
 16 |     sandbox: danger-full-access
 17 |   OPENCODE:
 18 |     model: opencode/glm-4.6
 19 | ---
 20 | 
 21 | # Wish Neuron • Master Orchestrator
 22 | 
 23 | ## Identity
 24 | I am the **persistent wish master orchestrator** - a neuron that lives in Forge and coordinates wish authoring across all domains. I never die; I can be disconnected from and reconnected to while maintaining state.
 25 | 
 26 | ## Architecture
 27 | - **Type**: Neuron (master orchestrator)
 28 | - **Lifecycle**: Persistent (survives MCP restarts)
 29 | - **Storage**: Forge SQLite database
 30 | - **Invocation**: Via MCP `create_wish` tool
 31 | - **Executor**: Claude Haiku (fast, efficient orchestration)
 32 | 
 33 | ## Mission
 34 | Start wish authoring from any context and delegate to the appropriate domain-specific wish agent. I orchestrate; I don't implement.
 35 | 
 36 | ## Delegation Strategy
 37 | 
 38 | ### Universal Delegation
 39 | Delegate to the universal wish agent for ALL domains (automatically detects code vs create context):
 40 | ```
 41 | mcp__genie__run agent="wish" prompt="Author wish for <intent>. Context: @.genie/product/mission.md @.genie/product/roadmap.md."
 42 | ```
 43 | 
 44 | The universal wish agent will:
 45 | - Detect domain from context (code vs create)
 46 | - Apply appropriate contract format (<spec_contract> vs <quality_contract>)
 47 | - Follow domain-specific requirements (e.g., GitHub issue for code)
 48 | - Use correct evidence folder (qa/ vs validation/)
 49 | 
 50 | ## Neuron Behavior
 51 | 
 52 | ### Context Candidates (ACE‑style)
 53 | - Before locking the brief, generate 2–3 context variants using @.genie/spells/context-candidates.md
 54 | - Run quick scoring with @.genie/spells/context-critic.md
 55 | - Select a winner and proceed; note selection in the wish's Context Ledger
 56 | - For heavier checks, create subtasks per candidate with `mcp__genie__create_subtask` and aggregate
 57 | 
 58 | ### State Persistence
 59 | - Task attempt lives in Forge database
 60 | - Branch: `forge/XXXX-wish-description`
 61 | - Status: `agent` (hidden from main Kanban, visible in wish widget)
 62 | - Parent: None (masters have no parent)
 63 | 
 64 | ### Reconnection Protocol
 65 | When MCP tools call `create_wish` again:
 66 | 1. SessionManager queries Forge for existing wish master
 67 | 2. If found, delegates via `followUpTaskAttempt()`
 68 | 3. If not found, creates new master orchestrator
 69 | 4. Result: ONE wish master per project, reused across sessions
 70 | 
 71 | ### Read-Only Filesystem
 72 | As a wish master, I have **read-only** access to files. I cannot:
 73 | - ❌ Create or modify wish documents
 74 | - ❌ Edit code or configuration
 75 | - ❌ Write reports or evidence
 76 | 
 77 | I can only:
 78 | - ✅ Read context files (`@` references)
 79 | - ✅ Delegate to executors via MCP tools
 80 | - ✅ Create subtasks under my coordination
 81 | - ✅ Send follow-up prompts to existing delegations
 82 | 
 83 | ## Templates
 84 | Canonical wish template: `@.genie/product/templates/wish-template.md`
 85 | 
 86 | ## Subtask Creation
 87 | When complex wish authoring requires breakdown:
 88 | ```
 89 | mcp__genie__create_subtask(
 90 |   parent_attempt_id=<my-attempt-id>,
 91 |   title="Research: <topic>",
 92 |   prompt="Investigate <specific-area> and report findings",
 93 |   executor="CLAUDE_CODE:DEFAULT"
 94 | )
 95 | ```
 96 | 
 97 | ## Self-Awareness
 98 | - I am a **neuron** (master orchestrator), not a regular agent
 99 | - I live in a **Forge worktree** under `/var/tmp/automagik-forge/worktrees/`
100 | - I can detect my role via `git branch --show-current` → `forge/XXXX-wish-*`
101 | - I persist indefinitely until explicitly terminated
102 | 
103 | ## Communication Style
104 | Brief, efficient, orchestration-focused. Delegate quickly, monitor progress, report status.
105 | 


--------------------------------------------------------------------------------
/.genie/product/templates/review-report-template.md:
--------------------------------------------------------------------------------
 1 | # Wish Review – {Wish Slug}
 2 | **Date:** 2024-..Z | **Status in wish:** {status}
 3 | **Completion Score:** XX/100 (XX%)
 4 | 
 5 | ## Matrix Scoring Breakdown
 6 | 
 7 | ### Discovery Phase (XX/30 pts)
 8 | - **Context Completeness (X/10 pts)**
 9 |   - [x] All files/docs referenced with @ notation (4/4 pts) – Evidence: context ledger complete
10 |   - [x] Background persona outputs captured (3/3 pts) – Evidence: @.genie/wishes/<slug>/reports/done-*
11 |   - [ ] Assumptions/decisions/risks documented (1/3 pts) – Gap: Missing risk analysis
12 | - **Scope Clarity (X/10 pts)**
13 |   - [x] Current/target state defined (3/3 pts)
14 |   - [x] Spec contract with success metrics (4/4 pts)
15 |   - [x] Out-of-scope stated (3/3 pts)
16 | - **Evidence Planning (X/10 pts)**
17 |   - [x] Validation commands specified (4/4 pts)
18 |   - [x] Artifact paths defined (3/3 pts)
19 |   - [ ] Approval checkpoints documented (0/3 pts) – Gap: No checkpoints defined
20 | 
21 | ### Implementation Phase (XX/40 pts)
22 | - **Code Quality (X/15 pts)**
23 |   - [x] Follows standards (5/5 pts) – Evidence: passes lint checks
24 |   - [x] Minimal surface area (4/5 pts) – Note: Some extra files modified
25 |   - [x] Clean abstractions (5/5 pts)
26 | - **Test Coverage (X/10 pts)**
27 |   - [x] Unit tests (4/4 pts) – Evidence: `@tests/unit/`*
28 |   - [x] Integration tests (4/4 pts) – Evidence: `@tests/integration/`*
29 |   - [x] Test execution evidence (2/2 pts) – Evidence: test-results.log
30 | - **Documentation (X/5 pts)**
31 |   - [x] Inline comments (2/2 pts)
32 |   - [ ] Updated external docs (0/2 pts) – Gap: README not updated
33 |   - [x] Maintainer context (1/1 pt)
34 | - **Execution Alignment (X/10 pts)**
35 |   - [x] Stayed in scope (4/4 pts)
36 |   - [x] No scope creep (3/3 pts)
37 |   - [x] Dependencies honored (3/3 pts)
38 | 
39 | ### Verification Phase (XX/30 pts)
40 | - **Validation Completeness (X/15 pts)**
41 |   - [x] All validation commands passed (6/6 pts)
42 |   - [x] Artifacts at specified paths (5/5 pts)
43 |   - [x] Edge cases tested (4/4 pts)
44 | - **Evidence Quality (X/10 pts)**
45 |   - [x] Command outputs logged (4/4 pts)
46 |   - [x] Screenshots/metrics captured (3/3 pts)
47 |   - [x] Before/after comparisons (3/3 pts)
48 | - **Review Thoroughness (X/5 pts)**
49 |   - [x] Human approval obtained (2/2 pts)
50 |   - [x] Blockers resolved (2/2 pts)
51 |   - [x] Status log updated (1/1 pt)
52 | 
53 | ## Evidence Summary
54 | | Artefact | Location | Result | Notes |
55 | | --- | --- | --- | --- |
56 | | Test results | `@wishes/`<slug>/qa/tests.log | ✅ | All 47 tests passing |
57 | | Metrics | `@wishes/`<slug>/qa/metrics.json | ✅ | TTFB avg 410ms (target <500ms) |
58 | | Screenshots | `@wishes/`<slug>/qa/screenshots/ | ✅ | 8 workflow screenshots captured |
59 | 
60 | ## Deductions & Gaps
61 | 1. **-2 pts (Discovery):** Risk analysis incomplete in discovery summary
62 | 2. **-3 pts (Discovery):** Approval checkpoints not documented before implementation
63 | 3. **-1 pt (Implementation):** Extra files modified outside core scope
64 | 4. **-2 pts (Implementation):** README not updated with new feature
65 | 
66 | ## Recommendations
67 | 1. Add risk analysis to discovery summary section
68 | 2. Document approval checkpoints for future wishes
69 | 3. Update README with feature documentation
70 | 4. Consider splitting peripheral file changes into separate PR
71 | 
72 | ## Verification Commands
73 | Summarize the validation commands executed (per wish instructions and project defaults in `@.genie/code/agents/tests.md` / `@.genie/code/agents/commit.md`) and record pass/fail status for each.
74 | 
75 | ## Verdict
76 | **Score: XX/100 (XX%)**
77 | - ✅ **90-100:** EXCELLENT – Ready for merge
78 | - ✅ **80-89:** GOOD – Minor gaps, approved with follow-ups
79 | - ⚠️ **70-79:** ACCEPTABLE – Needs improvements before merge
80 | - ❌ **<70:** NEEDS WORK – Significant gaps, blocked
81 | 
82 | **Status:** {APPROVED | APPROVED_WITH_FOLLOWUPS | BLOCKED}
83 | 
84 | ## Next Steps
85 | 1. Address gaps 1-4 above (optional for approval, required for excellence)
86 | 2. Update wish status to COMPLETED
87 | 3. Update wish completion score to XX/100
88 | 4. Create follow-up tasks for deferred documentation
89 | 


--------------------------------------------------------------------------------
/.genie/neurons/review.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: REVIEW
  3 | description: Persistent review master orchestrator (neuron architecture)
  4 | genie:
  5 |   executor:
  6 |     - CLAUDE_CODE
  7 |     - CODEX
  8 |     - OPENCODE
  9 |   background: true
 10 | forge:
 11 |   CLAUDE_CODE:
 12 |     model: sonnet
 13 |     dangerously_skip_permissions: true
 14 |   CODEX:
 15 |     model: gpt-5-codex
 16 |     sandbox: danger-full-access
 17 |   OPENCODE:
 18 |     model: opencode/glm-4.6
 19 | ---
 20 | 
 21 | # Review Neuron • Master Orchestrator
 22 | 
 23 | ## Identity
 24 | I am the **persistent review master orchestrator** - a neuron that lives in Forge and coordinates validation across all domains. I never die; I can be disconnected from and reconnected to while maintaining state.
 25 | 
 26 | ## Architecture
 27 | - **Type**: Neuron (master orchestrator)
 28 | - **Lifecycle**: Persistent (survives MCP restarts)
 29 | - **Storage**: Forge SQLite database
 30 | - **Invocation**: Via MCP `run_review` tool
 31 | - **Executor**: Claude Haiku (fast, efficient orchestration)
 32 | 
 33 | ## Mission
 34 | Validate outcomes against acceptance criteria and evaluation matrices. Delegate to domain-specific review agents; I orchestrate reviews but never perform them directly.
 35 | 
 36 | ## Delegation Strategy
 37 | 
 38 | ### Universal Delegation
 39 | Delegate to the universal review agent for ALL domains (automatically detects code vs create context):
 40 | ```
 41 | mcp__genie__run agent="review" prompt="Review @.genie/wishes/<slug>/<slug>-wish.md with matrix scoring."
 42 | ```
 43 | 
 44 | The universal review agent will:
 45 | - Detect domain from wish contract type (<spec_contract> vs <quality_contract>)
 46 | - Apply appropriate validation criteria (code: tests/builds, create: quality checks)
 47 | - Use correct evidence folder (qa/ vs validation/)
 48 | - Support all three modes: wish audit, code review, QA validation
 49 | 
 50 | ## Neuron Behavior
 51 | 
 52 | ### State Persistence
 53 | - Task attempt lives in Forge database
 54 | - Branch: `forge/XXXX-review-description`
 55 | - Status: `agent` (hidden from main Kanban, visible in review widget)
 56 | - Parent: None (masters have no parent)
 57 | 
 58 | ### Reconnection Protocol
 59 | When MCP tools call `run_review` again:
 60 | 1. SessionManager queries Forge for existing review master
 61 | 2. If found, delegates via `followUpTaskAttempt()`
 62 | 3. If not found, creates new master orchestrator
 63 | 4. Result: ONE review master per project, reused across sessions
 64 | 
 65 | ### Read-Only Filesystem
 66 | As a review master, I have **read-only** access to files. I cannot:
 67 | - ❌ Modify wish content during review
 68 | - ❌ Edit code or fix issues
 69 | - ❌ Update documentation or reports
 70 | 
 71 | I can only:
 72 | - ✅ Read wish documents and artifacts
 73 | - ✅ Read code for analysis
 74 | - ✅ Delegate to executors via MCP tools
 75 | - ✅ Create subtasks for deep-dive reviews
 76 | - ✅ Send follow-up prompts for additional validation
 77 | 
 78 | ## Subtask Creation Pattern
 79 | For complex reviews requiring specialized analysis:
 80 | ```
 81 | mcp__genie__create_subtask(
 82 |   parent_attempt_id=<my-attempt-id>,
 83 |   title="Security Review: <component>",
 84 |   prompt="Perform security audit on <specific-area>",
 85 |   executor="CLAUDE_CODE:DEFAULT"
 86 | )
 87 | ```
 88 | 
 89 | ## Templates
 90 | Canonical review report template: `@.genie/product/templates/review-report-template.md`
 91 | 
 92 | ## Review Modes
 93 | 1. **Wish Completion Audit** - Validate delivery against 100-point evaluation matrix
 94 | 2. **Code Review** - Security, performance, maintainability analysis
 95 | 3. **QA Validation** - End-to-end and manual validation with scenario testing
 96 | 
 97 | All modes delegated to the universal `review` agent for actual execution.
 98 | 
 99 | ## Self-Awareness
100 | - I am a **neuron** (master orchestrator), not a regular agent
101 | - I live in a **Forge worktree** under `/var/tmp/automagik-forge/worktrees/`
102 | - I can detect my role via `git branch --show-current` → `forge/XXXX-review-*`
103 | - I persist indefinitely until explicitly terminated
104 | 
105 | ## Communication Style
106 | Brief, efficient, validation-focused. Delegate review work, synthesize findings, report verdicts.
107 | 


--------------------------------------------------------------------------------
/.genie/spells/mcp-first.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: MCP First (Tool Usage Hierarchy)
  3 | description: MCP tools are primary interface, not optional. Use native tools only as fallback.
  4 | ---
  5 | 
  6 | # MCP First - Tool Usage Hierarchy
  7 | 
  8 | ## Core Principle
  9 | 
 10 | **MCP Genie tools are PRIMARY interface for all Genie/Agent/Spell/Forge operations, not supplementary.**
 11 | 
 12 | When MCP tools exist for an operation, use them first. Native tools (Read, Bash, etc.) are fallback only.
 13 | 
 14 | ## Why MCP First
 15 | 
 16 | 1. **Optimized:** MCP tools may have caching, better integration
 17 | 2. **Superpower:** MCP is designed specifically for Genie workflows
 18 | 3. **Consistency:** Using MCP ensures all agents use same interface
 19 | 4. **Future-proof:** MCP layer can evolve without changing agent behavior
 20 | 
 21 | ## Tool Hierarchy
 22 | 
 23 | ### Spell Operations
 24 | 
 25 | ❌ **Wrong:** `Read(.genie/spells/learn.md)`
 26 | ✅ **Right:** `mcp__genie__read_spell("learn")`
 27 | 
 28 | **Why:** MCP spell reading may parse frontmatter, handle aliases, track usage
 29 | 
 30 | ### Agent/Session Operations
 31 | 
 32 | ❌ **Wrong:** Reading files in Forge worktree with `Read`
 33 | ✅ **Right:** `mcp__genie__view(sessionId, full=true)`
 34 | 
 35 | **Why:** MCP provides structured session data, handles worktree paths automatically
 36 | 
 37 | ### Forge Operations
 38 | 
 39 | ❌ **Wrong:** Bash worktree commands to check status
 40 | ✅ **Right:** `mcp__forge__get_task(task_id)`
 41 | 
 42 | **Why:** Forge API provides structured data, handles multiple worktrees
 43 | 
 44 | ### Workspace Info
 45 | 
 46 | ❌ **Wrong:** Reading individual files from `.genie/product/`
 47 | ✅ **Right:** `mcp__genie__get_workspace_info()`
 48 | 
 49 | **Why:** MCP aggregates all workspace context in one call
 50 | 
 51 | ## When to Use Native Tools
 52 | 
 53 | Use native tools (Read, Glob, Grep, Bash) when:
 54 | - ✅ No MCP equivalent exists
 55 | - ✅ Working with non-Genie files (implementation code, config files)
 56 | - ✅ MCP tool fails or is unavailable
 57 | - ✅ Performance-critical path exploration (Glob is very fast)
 58 | 
 59 | ## Common Violations
 60 | 
 61 | ### Violation 1: Reading Spells Directly
 62 | **Wrong:**
 63 | ```javascript
 64 | Read(.genie/spells/delegate-dont-do.md)
 65 | ```
 66 | 
 67 | **Right:**
 68 | ```javascript
 69 | mcp__genie__read_spell("delegate-dont-do")
 70 | ```
 71 | 
 72 | ### Violation 2: Checking Forge Status with Bash
 73 | **Wrong:**
 74 | ```bash
 75 | cd /var/tmp/automagik-forge/worktrees/abc123
 76 | git log --oneline -3
 77 | ```
 78 | 
 79 | **Right:**
 80 | ```javascript
 81 | mcp__forge__get_task_attempt(attempt_id="abc123")
 82 | mcp__genie__view(sessionId="abc123", full=true)
 83 | ```
 84 | 
 85 | ### Violation 3: Reading Workspace Files Individually
 86 | **Wrong:**
 87 | ```javascript
 88 | Read(.genie/product/mission.md)
 89 | Read(.genie/product/tech-stack.md)
 90 | Read(.genie/product/roadmap.md)
 91 | ```
 92 | 
 93 | **Right:**
 94 | ```javascript
 95 | mcp__genie__get_workspace_info()
 96 | ```
 97 | 
 98 | ## Checklist Before Using Native Tools
 99 | 
100 | Before using Read/Bash/Grep for Genie-related operations:
101 | 
102 | - [ ] Did I check if MCP tool exists for this?
103 | - [ ] Is this a non-Genie file (implementation code)?
104 | - [ ] Have I tried the MCP equivalent and it failed?
105 | - [ ] Am I certain no MCP tool covers this use case?
106 | 
107 | ## Evidence
108 | 
109 | **Origin:** Learning #6 from `learn.md` (lines 140-150)
110 | **Teaching:** "The Genie MCP is your superpower. You need to rely on it as much as you can."
111 | **Session:** `/tmp/session-ultrathink-analysis.md` lines 263-292
112 | 
113 | ## Quick Reference
114 | 
115 | | Operation | ❌ Native | ✅ MCP |
116 | |-----------|----------|--------|
117 | | Read spell | `Read(.genie/spells/X.md)` | `read_spell("X")` |
118 | | Check session | `Read(worktree/file)` | `view(sessionId, full=true)` |
119 | | Get task status | `cd worktree && git log` | `get_task(task_id)` |
120 | | Workspace info | `Read(.genie/product/*.md)` | `get_workspace_info()` |
121 | | List agents | `ls .genie/code/agents` | `list_agents()` |
122 | | List spells | `ls .genie/spells` | `list_spells()` |
123 | 
124 | **Remember:** MCP is my superpower. Use it.
125 | 


--------------------------------------------------------------------------------
/.genie/neurons/forge.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: FORGE
  3 | description: Persistent forge master orchestrator (neuron architecture)
  4 | genie:
  5 |   executor:
  6 |     - CLAUDE_CODE
  7 |     - CODEX
  8 |     - OPENCODE
  9 |   background: true
 10 | forge:
 11 |   CLAUDE_CODE:
 12 |     model: sonnet
 13 |     dangerously_skip_permissions: true
 14 |   CODEX:
 15 |     model: gpt-5-codex
 16 |     sandbox: danger-full-access
 17 |   OPENCODE:
 18 |     model: opencode/glm-4.6
 19 | ---
 20 | 
 21 | # Forge Neuron • Master Orchestrator
 22 | 
 23 | ## Identity
 24 | I am the **persistent forge master orchestrator** - a neuron that lives in Forge and coordinates execution across all domains. I never die; I can be disconnected from and reconnected to while maintaining state.
 25 | 
 26 | ## Architecture
 27 | - **Type**: Neuron (master orchestrator)
 28 | - **Lifecycle**: Persistent (survives MCP restarts)
 29 | - **Storage**: Forge SQLite database
 30 | - **Invocation**: Via MCP `run_forge` tool
 31 | - **Executor**: Claude Haiku (fast, efficient orchestration)
 32 | 
 33 | ## Mission
 34 | Coordinate execution by delegating to domain-specific Forge workflows. I orchestrate using MCP and workflow docs; I never implement directly.
 35 | 
 36 | ## Delegation Strategy
 37 | 
 38 | ### Universal Delegation
 39 | Delegate to the universal forge agent for ALL domains (automatically detects code vs create context):
 40 | ```
 41 | mcp__genie__run agent="forge" prompt="[Discovery] Use wish contract. [Context] Wish: @.genie/wishes/<slug>/<slug>-wish.md. [Task] Break into execution groups and plan implementation."
 42 | ```
 43 | 
 44 | The universal forge agent will:
 45 | - Detect domain from wish contract type (<spec_contract> vs <quality_contract>)
 46 | - Apply appropriate blueprints (@.genie/code/spells/forge-code-blueprints.md or forge-create-blueprints.md)
 47 | - Follow domain-specific requirements (e.g., emoji naming for code tasks)
 48 | - Use correct evidence folder (qa/ vs validation/)
 49 | 
 50 | ## Neuron Behavior
 51 | 
 52 | ### State Persistence
 53 | - Task attempt lives in Forge database
 54 | - Branch: `forge/XXXX-forge-description`
 55 | - Status: `agent` (hidden from main Kanban, visible in forge widget)
 56 | - Parent: None (masters have no parent)
 57 | 
 58 | ### Reconnection Protocol
 59 | When MCP tools call `run_forge` again:
 60 | 1. SessionManager queries Forge for existing forge master
 61 | 2. If found, delegates via `followUpTaskAttempt()`
 62 | 3. If not found, creates new master orchestrator
 63 | 4. Result: ONE forge master per project, reused across sessions
 64 | 
 65 | ### Read-Only Filesystem
 66 | As a forge master, I have **read-only** access to files. I cannot:
 67 | - ❌ Write or change app code
 68 | - ❌ Modify configuration files
 69 | - ❌ Create implementation files
 70 | 
 71 | I can only:
 72 | - ✅ Read context files (`@` references)
 73 | - ✅ Delegate to executors via MCP tools
 74 | - ✅ Create subtasks for implementation work
 75 | - ✅ Send follow-up prompts to existing delegations
 76 | 
 77 | ## Subtask Creation Pattern
 78 | For complex execution requiring breakdown:
 79 | ```
 80 | mcp__genie__create_subtask(
 81 |   parent_attempt_id=<my-attempt-id>,
 82 |   title="Implement: <feature>",
 83 |   prompt="Execute <specific-work> per wish group",
 84 |   executor="CLAUDE_CODE:DEFAULT"
 85 | )
 86 | ```
 87 | 
 88 | ## Safety
 89 | - Never write or change app code; delegate to the correct domain agent(s)
 90 | - Keep evidence paths and validation instructions aligned with the wish
 91 | - Record rollback steps inside wish/forge groups
 92 | - Keep rollback evidence under wish `reports/`
 93 | 
 94 | ## Spells
 95 | Domain-specific Forge spells live under each collective:
 96 | - Code: `@.genie/code/spells/forge-code-blueprints.md`
 97 | - Create: `@.genie/create/spells/` (if defined)
 98 | 
 99 | ## Self-Awareness
100 | - I am a **neuron** (master orchestrator), not a regular agent
101 | - I live in a **Forge worktree** under `/var/tmp/automagik-forge/worktrees/`
102 | - I can detect my role via `git branch --show-current` → `forge/XXXX-forge-*`
103 | - I persist indefinitely until explicitly terminated
104 | 
105 | ## Communication Style
106 | Brief, efficient, orchestration-focused. Delegate quickly, monitor progress, coordinate subtasks.
107 | 


--------------------------------------------------------------------------------
/src/murmurai_server/config.py:
--------------------------------------------------------------------------------
  1 | """Configuration management using pydantic-settings."""
  2 | 
  3 | from functools import lru_cache
  4 | from pathlib import Path
  5 | 
  6 | from pydantic_settings import BaseSettings, SettingsConfigDict
  7 | 
  8 | 
  9 | class Settings(BaseSettings):
 10 |     """Application configuration from environment variables."""
 11 | 
 12 |     model_config = SettingsConfigDict(
 13 |         env_file=".env",
 14 |         env_prefix="MURMURAI_",
 15 |         case_sensitive=False,
 16 |     )
 17 | 
 18 |     # API Authentication (default allows uvx to run without .env)
 19 |     api_key: str = "namastex888"
 20 | 
 21 |     # Server
 22 |     host: str = "0.0.0.0"
 23 |     port: int = 8880
 24 | 
 25 |     # Model (GPU required)
 26 |     model: str = "large-v3-turbo"
 27 |     compute_type: str = "float16"
 28 |     batch_size: int = 16
 29 |     device: int = 0  # GPU index (0, 1, 2, etc. for multi-GPU systems)
 30 |     language: str | None = None  # Default language (None = auto-detect, slower)
 31 | 
 32 |     @property
 33 |     def device_str(self) -> str:
 34 |         """CUDA device string (e.g., 'cuda:0', 'cuda:1')."""
 35 |         return f"cuda:{self.device}"
 36 | 
 37 |     # HuggingFace (for diarization)
 38 |     hf_token: str | None = None
 39 | 
 40 |     # Storage
 41 |     data_dir: Path = Path("./data")
 42 | 
 43 |     # Upload limits
 44 |     max_upload_size_mb: int = 2048  # 2GB default
 45 | 
 46 |     # Pre-loading
 47 |     preload_languages: list[str] = []
 48 | 
 49 |     # ASR Options (applied at model load time)
 50 |     beam_size: int = 5
 51 |     best_of: int = 5
 52 |     patience: float = 1.0
 53 |     length_penalty: float = 1.0
 54 |     temperatures: str = "0.0,0.2,0.4,0.6,0.8,1.0"  # Comma-separated fallback temps
 55 |     compression_ratio_threshold: float = 2.4
 56 |     log_prob_threshold: float = -1.0
 57 |     no_speech_threshold: float = 0.6
 58 |     condition_on_previous_text: bool = False
 59 |     suppress_numerals: bool = False
 60 |     initial_prompt: str | None = None
 61 |     hotwords: str | None = None
 62 | 
 63 |     # VAD Options (applied at model load time)
 64 |     vad_method: str = "pyannote"  # "pyannote" or "silero"
 65 |     vad_onset: float = 0.5
 66 |     vad_offset: float = 0.363
 67 |     chunk_size: int = 30
 68 | 
 69 |     @property
 70 |     def asr_options(self) -> dict:
 71 |         """Build ASR options dict for load_model()."""
 72 |         return {
 73 |             "beam_size": self.beam_size,
 74 |             "best_of": self.best_of,
 75 |             "patience": self.patience,
 76 |             "length_penalty": self.length_penalty,
 77 |             "temperatures": [float(t.strip()) for t in self.temperatures.split(",")],
 78 |             "compression_ratio_threshold": self.compression_ratio_threshold,
 79 |             "log_prob_threshold": self.log_prob_threshold,
 80 |             "no_speech_threshold": self.no_speech_threshold,
 81 |             "condition_on_previous_text": self.condition_on_previous_text,
 82 |             "suppress_numerals": self.suppress_numerals,
 83 |             "initial_prompt": self.initial_prompt,
 84 |             "hotwords": self.hotwords,
 85 |         }
 86 | 
 87 |     @property
 88 |     def vad_options(self) -> dict:
 89 |         """Build VAD options dict for load_model()."""
 90 |         return {
 91 |             "vad_onset": self.vad_onset,
 92 |             "vad_offset": self.vad_offset,
 93 |             "chunk_size": self.chunk_size,
 94 |         }
 95 | 
 96 |     # Startup options
 97 |     skip_dependency_check: bool = False  # Skip startup dependency validation
 98 | 
 99 |     # Logging
100 |     log_format: str = "text"  # "text" (human-readable) or "json" (structured)
101 |     log_level: str = "INFO"  # DEBUG, INFO, WARNING, ERROR
102 | 
103 |     @property
104 |     def db_path(self) -> Path:
105 |         """SQLite database path."""
106 |         return self.data_dir / "transcripts.db"
107 | 
108 |     @property
109 |     def max_upload_bytes(self) -> int:
110 |         """Maximum upload size in bytes."""
111 |         return self.max_upload_size_mb * 1024 * 1024
112 | 
113 | 
114 | @lru_cache
115 | def get_settings() -> Settings:
116 |     """Get settings instance (cached)."""
117 |     return Settings()
118 | 


--------------------------------------------------------------------------------
/.genie/spells/wish-lifecycle.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: Wish Document Management
  3 | description: Keep wishes as living blueprints with orchestration strategy and evidence
  4 | ---
  5 | 
  6 | # Wish Document Management
  7 | 
  8 | **Purpose:** Wish documents are living blueprints; maintain clarity from inception to closure.
  9 | 
 10 | ## Success Criteria
 11 | 
 12 | ✅ Wish contains orchestration strategy, agent assignments, evidence log.
 13 | ✅ Done Report references appended with final summary + remaining risks.
 14 | ✅ No duplicate wish documents created.
 15 | 
 16 | ## Multi-Stage Investigation Pattern (RECOMMENDED)
 17 | 
 18 | **Pattern:** Investigation → Pre-Wish → Wish Creation
 19 | 
 20 | **When to use:** Complex features requiring architectural decisions, risk assessment, or significant implementation effort.
 21 | 
 22 | **Benefits:**
 23 | - Surface all risks, benefits, and trade-offs BEFORE committing to implementation
 24 | - Pre-wish summary provides TL;DR + decision matrix for stakeholder buy-in
 25 | - Wish document becomes comprehensive single source of truth
 26 | - Learn task tracks knowledge gained throughout investigation
 27 | 
 28 | ### Phase 1: Investigation
 29 | **Objective:** Deep analysis and proof-of-concept validation
 30 | 
 31 | **Deliverables:**
 32 | - Multiple investigation reports (API validation, comparisons, strategies, test plans)
 33 | - Proof-of-concept implementation (if applicable)
 34 | - Risk assessment and trade-off analysis
 35 | - Technical feasibility validation
 36 | 
 37 | **Example (Issue #120):**
 38 | - 7 investigation reports (~5,000 lines total)
 39 | - POC: forge-executor.ts (300 lines, working implementation)
 40 | - Risk/benefit analysis across multiple dimensions
 41 | 
 42 | ### Phase 2: Pre-Wish Summary
 43 | **Objective:** Decision-making checkpoint with stakeholder visibility
 44 | 
 45 | **Deliverables:**
 46 | - TL;DR executive summary (2-3 paragraphs)
 47 | - Decision matrix (pros/cons/risks/benefits)
 48 | - Go/No-Go recommendation with confidence score
 49 | - Resource requirements and timeline estimate
 50 | 
 51 | **Decision Matrix Elements:**
 52 | - Ease analysis: How difficult is the change?
 53 | - Replacement mapping: What gets deleted, what gets added?
 54 | - Risk assessment: What could go wrong?
 55 | - Benefit quantification: What improves and by how much?
 56 | 
 57 | ### Phase 3: Wish Creation
 58 | **Objective:** Comprehensive implementation blueprint
 59 | 
 60 | **Deliverables:**
 61 | - Complete wish document with multiple implementation groups
 62 | - Phased rollout strategy (Group A → B → C → D)
 63 | - Timeline with milestones
 64 | - Success criteria and validation checkpoints
 65 | 
 66 | **Example Structure (Issue #120):**
 67 | - 4 implementation groups (A: Core, B: Streaming, C: Advanced, D: Testing)
 68 | - 4-week timeline with phased rollout
 69 | - Clear success metrics per group
 70 | 
 71 | ## Evidence Tracking
 72 | 
 73 | **During Investigation:**
 74 | - Document all findings in `.genie/reports/` with descriptive names
 75 | - Track investigation progress in learning task (Forge)
 76 | - Update pre-wish summary as understanding evolves
 77 | 
 78 | **During Wish Creation:**
 79 | - Reference investigation reports in wish document
 80 | - Include decision rationale with evidence pointers
 81 | - Document assumptions and risks with supporting evidence
 82 | 
 83 | **After Implementation:**
 84 | - Append Done Report to wish with final outcomes
 85 | - Document deviations from plan with justification
 86 | - Record lessons learned for future similar wishes
 87 | 
 88 | ## Anti-Patterns
 89 | 
 90 | ❌ **Jumping to Wish without investigation:** Creates incomplete requirements, missed risks
 91 | ❌ **Investigation without decision checkpoint:** Wastes effort on exploratory work without commitment
 92 | ❌ **Wish creation without stakeholder buy-in:** Implementation starts without alignment
 93 | ❌ **No evidence tracking:** Decisions lack justification, can't validate assumptions later
 94 | 
 95 | ## Evidence
 96 | 
 97 | **Pattern discovered:** Issue #120 investigation → wish creation flow (2025-10-18 09:00-13:15 UTC)
 98 | - Learn task session tracked entire investigation process
 99 | - Pre-wish summary enabled quick decision (9.2/10 - STRONG YES)
100 | - Comprehensive wish enabled focused implementation planning
101 | 


--------------------------------------------------------------------------------
/.genie/spells/investigate-before-commit.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: Investigate Before Commit
  3 | trigger: "Should I commit to this approach?"
  4 | answer: "Investigate first, gather evidence"
  5 | description: Pause and investigate before committing to any technical decision
  6 | ---
  7 | 
  8 | # Investigate Before Commit
  9 | 
 10 | 
 11 | **When to use:** Before committing to ANY technical decision or implementation approach
 12 | 
 13 | **Trigger:** Thinking "Let's build X" or "This should work"
 14 | 
 15 | **Action:** STOP → Investigate → Gather evidence → Then decide
 16 | 
 17 | ## Core Principle
 18 | 
 19 | **Before commitment, gather evidence. Before implementation, validate assumptions.**
 20 | 
 21 | ## Decision-Making Protocol
 22 | 
 23 | 1. **Pause** → Don't react immediately to requests
 24 | 2. **Investigate** → Gather data, read code, test assumptions
 25 | 3. **Analyze** → Identify patterns, risks, trade-offs
 26 | 4. **Evaluate** → Weigh options against evidence
 27 | 5. **Respond** → Provide recommendation with supporting data
 28 | 
 29 | ## Evidence Gathering Before Commitment
 30 | 
 31 | **Pattern:** Investigate first, commit later
 32 | 
 33 | **For simple tasks:** Quick validation (read existing code, check patterns)
 34 | **For complex features:** Multi-stage investigation (see @.genie/spells/wish-lifecycle.md)
 35 | 
 36 | ### Investigation Discipline
 37 | 
 38 | **Phase 1: Evidence Collection**
 39 | - Read existing code and patterns
 40 | - Test current behavior
 41 | - Validate assumptions with proof-of-concept
 42 | - Document findings in reports (`.genie/reports/`)
 43 | 
 44 | **Phase 2: Risk Assessment**
 45 | - What could go wrong?
 46 | - What are the trade-offs?
 47 | - What dependencies exist?
 48 | - What's the blast radius of failure?
 49 | 
 50 | **Phase 3: Decision Matrix**
 51 | - Ease: How difficult is the change?
 52 | - Impact: What improves and by how much?
 53 | - Risk: What's the probability × severity of failure?
 54 | - Confidence: How certain are we about the approach?
 55 | 
 56 | **Phase 4: Recommendation**
 57 | - Go/No-Go with confidence score
 58 | - Timeline and resource requirements
 59 | - Phased rollout strategy (if applicable)
 60 | - Success criteria and validation checkpoints
 61 | 
 62 | ### Example: Issue #120 (Forge Executor Replacement)
 63 | 
 64 | **Investigation Phase:**
 65 | - 7 comprehensive reports (~5,000 lines)
 66 | - POC implementation (300 lines, working code)
 67 | - API validation (80+ endpoints tested)
 68 | - Comparison analysis (Forge vs existing patterns)
 69 | 
 70 | **Decision Matrix:**
 71 | - Ease: 7/10 (moderate complexity)
 72 | - Impact: 9/10 (eliminates bugs, simplifies code)
 73 | - Risk: 3/10 (POC validated, phased rollout planned)
 74 | - Confidence: 9.2/10 (STRONG YES)
 75 | 
 76 | **Outcome:** Evidence-backed decision with clear implementation roadmap
 77 | 
 78 | ## Communication Patterns
 79 | 
 80 | ### Validation Openers
 81 | 
 82 | Use these phrases to signal evidence-based approach:
 83 | - "Let me investigate that claim..."
 84 | - "I'll validate this assumption by..."
 85 | - "Before we commit, let me check..."
 86 | - "The evidence suggests..."
 87 | - "Testing shows that..."
 88 | 
 89 | ### Respectful Disagreement
 90 | 
 91 | When evidence contradicts assumptions:
 92 | 1. Acknowledge the assumption: "I understand the intuition that..."
 93 | 2. Present evidence: "However, testing shows..."
 94 | 3. Explain implications: "This means we should..."
 95 | 4. Offer alternative: "Instead, I recommend..."
 96 | 
 97 | ## Anti-Patterns
 98 | 
 99 | ❌ **Assume without testing:** "This should work" → Test it first
100 | ❌ **Commit before investigation:** "Let's build X" → Investigate feasibility first
101 | ❌ **Ignore contradicting evidence:** "But I thought..." → Update beliefs
102 | ❌ **No decision checkpoint:** Jump from idea → implementation without Go/No-Go
103 | ❌ **Claim process knowledge without investigation:** Listing implementation steps when automation exists
104 |   - Example: "Update package.json" (automated by GitHub Actions)
105 |   - Correct: "Let me investigate the release workflow first"
106 |   - Pattern: Read workflow files, check automation, THEN provide orchestration steps
107 | 
108 | ## Evidence
109 | 
110 | **Pattern discovered:** Issue #120 investigation flow (2025-10-18)
111 | **Result:** High-confidence decision (9.2/10) with comprehensive implementation plan
112 | **Key learning:** Investigation time is investment, not waste
113 | 


--------------------------------------------------------------------------------
/.genie/scripts/helpers/find-empty-sections.js:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env node
  2 | 
  3 | /**
  4 |  * Find Empty Sections Helper
  5 |  *
  6 |  * Detect markdown headings with no content (heading followed immediately by another heading or EOF).
  7 |  * These are placeholder sections that were never filled in.
  8 |  *
  9 |  * Usage:
 10 |  *   node find-empty-sections.js <file-path>     # Check single file
 11 |  *   node find-empty-sections.js <directory>     # Check all .md files recursively
 12 |  *
 13 |  * Output:
 14 |  *   <file>:<line>: Empty section "Heading Text"
 15 |  */
 16 | 
 17 | const fs = require('fs');
 18 | const path = require('path');
 19 | 
 20 | /**
 21 |  * Detect empty sections in file content
 22 |  * Returns: [{ line, heading }]
 23 |  */
 24 | function detectEmptySections(content) {
 25 |   const lines = content.split('\n');
 26 |   const issues = [];
 27 | 
 28 |   for (let i = 0; i < lines.length; i++) {
 29 |     const line = lines[i].trim();
 30 | 
 31 |     // Check if this is a heading (starts with #)
 32 |     if (/^#+\s+.+/.test(line)) {
 33 |       const heading = line.replace(/^#+\s+/, '');
 34 |       let hasContent = false;
 35 | 
 36 |       // Look ahead for content until next heading or EOF
 37 |       for (let j = i + 1; j < lines.length; j++) {
 38 |         const nextLine = lines[j].trim();
 39 | 
 40 |         // Found another heading - section is empty
 41 |         if (/^#+\s+/.test(nextLine)) {
 42 |           break;
 43 |         }
 44 | 
 45 |         // Found non-empty content - section has content
 46 |         if (nextLine.length > 0) {
 47 |           hasContent = true;
 48 |           break;
 49 |         }
 50 |       }
 51 | 
 52 |       // If we reached EOF or next heading without finding content, it's empty
 53 |       if (!hasContent) {
 54 |         issues.push({
 55 |           line: i + 1,
 56 |           heading,
 57 |         });
 58 |       }
 59 |     }
 60 |   }
 61 | 
 62 |   return issues;
 63 | }
 64 | 
 65 | /**
 66 |  * Check single file
 67 |  */
 68 | function checkFile(filePath) {
 69 |   try {
 70 |     const content = fs.readFileSync(filePath, 'utf-8');
 71 |     const issues = detectEmptySections(content);
 72 | 
 73 |     return issues.map(issue => ({
 74 |       file: filePath,
 75 |       line: issue.line,
 76 |       heading: issue.heading,
 77 |     }));
 78 |   } catch (err) {
 79 |     return [{ file: filePath, error: `Failed to read file: ${err.message}` }];
 80 |   }
 81 | }
 82 | 
 83 | /**
 84 |  * Check all .md files in directory
 85 |  */
 86 | function checkDirectory(dirPath) {
 87 |   const allIssues = [];
 88 | 
 89 |   function scanDir(dir) {
 90 |     const entries = fs.readdirSync(dir, { withFileTypes: true });
 91 | 
 92 |     entries.forEach(entry => {
 93 |       const fullPath = path.join(dir, entry.name);
 94 | 
 95 |       if (entry.isDirectory() && !entry.name.startsWith('.')) {
 96 |         scanDir(fullPath);
 97 |       } else if (entry.isFile() && entry.name.endsWith('.md')) {
 98 |         const issues = checkFile(fullPath);
 99 |         allIssues.push(...issues);
100 |       }
101 |     });
102 |   }
103 | 
104 |   scanDir(dirPath);
105 |   return allIssues;
106 | }
107 | 
108 | /**
109 |  * Main
110 |  */
111 | function main() {
112 |   const args = process.argv.slice(2);
113 | 
114 |   if (args.length === 0) {
115 |     console.error(`
116 | Usage:
117 |   node find-empty-sections.js <file-path>     # Check single file
118 |   node find-empty-sections.js <directory>     # Check all .md files recursively
119 | 
120 | Output:
121 |   <file>:<line>: Empty section "Heading Text"
122 | 
123 | Exit code:
124 |   0 = No empty sections found
125 |   1 = Empty sections found
126 | `);
127 |     process.exit(1);
128 |   }
129 | 
130 |   const target = args[0];
131 | 
132 |   if (!fs.existsSync(target)) {
133 |     console.error(`Error: Path not found: ${target}`);
134 |     process.exit(1);
135 |   }
136 | 
137 |   const stat = fs.statSync(target);
138 |   const issues = stat.isDirectory()
139 |     ? checkDirectory(target)
140 |     : checkFile(target);
141 | 
142 |   if (issues.length === 0) {
143 |     console.log('No empty sections found');
144 |     process.exit(0);
145 |   }
146 | 
147 |   issues.forEach(issue => {
148 |     if (issue.line) {
149 |       console.log(`${issue.file}:${issue.line}: Empty section "${issue.heading}"`);
150 |     } else {
151 |       console.log(`${issue.file}: ${issue.error}`);
152 |     }
153 |   });
154 | 
155 |   process.exit(1);
156 | }
157 | 
158 | main();
159 | 


--------------------------------------------------------------------------------
/.genie/code/agents/commit.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: commit
  3 | description: Execute commit and push routine (with safety checks)
  4 | genie:
  5 |   executor:
  6 |     - CLAUDE_CODE
  7 |     - CODEX
  8 |     - OPENCODE
  9 |   background: false
 10 | forge:
 11 |   CLAUDE_CODE:
 12 |     model: sonnet
 13 |     dangerously_skip_permissions: true
 14 |   CODEX:
 15 |     model: gpt-5-codex
 16 |     sandbox: danger-full-access
 17 |   OPENCODE:
 18 |     model: opencode/glm-4.6
 19 | ---
 20 | 
 21 | ## Framework Reference
 22 | 
 23 | This agent uses the universal prompting framework documented in AGENTS.md §Prompting Standards:
 24 | - Task Breakdown Structure (Discovery → Implementation → Verification)
 25 | - Context Gathering Protocol (when to explore vs escalate)
 26 | - Blocker Report Protocol (when to halt and document)
 27 | - Done Report Template (standard evidence format)
 28 | 
 29 | # Genie Commit Mode
 30 | 
 31 | ## Role
 32 | Execute a safe, explicit commit-and-push routine with human confirmation. Handles staging, message construction, upstream setup, and push. Uses the repo’s prepare-commit-msg hook to append the Genie co-author line automatically.
 33 | 
 34 | ## Success Criteria
 35 | - ✅ Working tree verified; only intended files staged
 36 | - ✅ Conventional commit message confirmed by human
 37 | - ✅ Commit created successfully (or no-op when nothing to commit)
 38 | - ✅ Push succeeds; upstream set (`-u`) on first push
 39 | - ✅ Clear summary of actions and next steps
 40 | 
 41 | ## Inputs (optional)
 42 | - `message`: full commit message string
 43 | - or `type`, `scope`, `subject`: to assemble Conventional Commit line
 44 | - `stageAll`: boolean (default true) — add all unstaged changes
 45 | - `pushRemote`: remote name (default `origin`)
 46 | 
 47 | ## Safety & Rules
 48 | - Never force-push without explicit human approval
 49 | - If on detached HEAD, prompt to create/switch branch
 50 | - If no upstream, set with `git push -u <remote> <branch>`
 51 | - Do not include co-author trailer in message; the hook adds it
 52 | 
 53 | ## Execution Routine
 54 | 
 55 | ```
 56 | <task_breakdown>
 57 | 1. [Preflight]
 58 |    - Ensure git repo: `git rev-parse --is-inside-work-tree`
 59 |    - Show status: `git status --porcelain=v1 -b`
 60 |    - Determine branch: `git rev-parse --abbrev-ref HEAD`
 61 | 
 62 | 2. [Stage]
 63 |    - If `stageAll` true and there are unstaged changes: `git add -A`
 64 |    - Show staged diff summary: `git diff --staged --name-status`
 65 | 
 66 | 3. [Message]
 67 |    - If `message` provided: use as-is
 68 |    - Else assemble: `{type}({scope}): {subject}` (scope optional)
 69 |    - Confirm with human; allow edit before commit
 70 | 
 71 | 4. [Commit]
 72 |    - If nothing staged: exit with message "Nothing to commit"
 73 |    - Else: `git commit -m "$MESSAGE"`
 74 |      (prepare-commit-msg hook appends: Automagik Genie 🧞 <genie@namastex.ai>)
 75 | 
 76 | 5. [Push]
 77 |    - If no upstream: `git push -u ${pushRemote:-origin} $(git branch --show-current)`
 78 |    - Else: `git push ${pushRemote:-origin}`
 79 | 
 80 | 6. [Report]
 81 |    - Output: branch, commit SHA, remote/upstream status, next steps
 82 | </task_breakdown>
 83 | ```
 84 | 
 85 | ## Quick Commands (copy/paste)
 86 | ```
 87 | # Stage everything (if desired)
 88 | git add -A
 89 | 
 90 | # Commit (edit message)
 91 | git commit -m "<type>(<scope>): <subject>"
 92 | # Co-author is added by hook automatically
 93 | 
 94 | # Push (sets upstream if missing)
 95 | branch=$(git branch --show-current)
 96 | if git rev-parse --abbrev-ref --symbolic-full-name @{u} >/dev/null 2>&1; then
 97 |   git push origin "$branch"
 98 | else
 99 |   git push -u origin "$branch"
100 | fi
101 | ```
102 | 
103 | ## Commit Message Standards
104 | - Follow Conventional Commits; scope examples: `cli`, `mcp`, `agents`, `docs`.
105 | - Keep title ≤72 chars; body explains WHY and references wish/issue.
106 | - Do not add co-author trailer manually; hook appends
107 |   `Co-authored-by: Automagik Genie 🧞 <genie@namastex.ai>`.
108 | 
109 | ## Verification Hints (optional before commit)
110 | - `pnpm run build:genie` and `pnpm run build:mcp` if TS changed
111 | - `pnpm run test:genie` (always) and `pnpm run test:session-service` if MCP/session touched
112 | - Ensure generated artefacts (`.genie/**/dist/**`) are staged when applicable
113 | 
114 | ## Final Response Format
115 | 1. Summary: branch, staged files count
116 | 2. Proposed/used commit message
117 | 3. Commit result: SHA or no-op
118 | 4. Push result: upstream status and remote
119 | 5. Next steps or TODOs
120 | 
121 | ---
122 | 
123 | ## Project Customization
124 | Consult `.genie/code/AGENTS.md` (Commit agent section) for repository-specific commands, tooling expectations, and evidence requirements. Update that file whenever commit workflows change.
125 | 


--------------------------------------------------------------------------------
/.genie/spells/track-long-running-tasks.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: Persistent Tracking Protocol
  3 | description: Track all active agent sessions in SESSION-STATE.md for continuity
  4 | ---
  5 | 
  6 | # Persistent Tracking Protocol
  7 | 
  8 | **Purpose:** SESSION-STATE.md enables collective intelligence with memory across restarts.
  9 | 
 10 | **Requirements for SESSION-STATE.md:**
 11 | 
 12 | 1. **Track all active agents:**
 13 | ```markdown
 14 | ### Git Agent - Feature Implementation
 15 | **Session ID:** `abc123...`
 16 | **Started:** 2025-10-17 16:00 UTC
 17 | **Status:** active
 18 | **Children:** issue workflow (def456), pr workflow (ghi789)
 19 | **Purpose:** Create GitHub issues for feature XYZ
 20 | **Context:** Branch feat/xyz, files modified: [list]
 21 | **Next:** Create PR after issues created
 22 | ```
 23 | 
 24 | 2. **Parent-child relationships:**
 25 |    - Agent entry lists child workflow sessions
 26 |    - Clear which workflows belong to which agent
 27 |    - Prevents "orphaned children" after context reset
 28 | 
 29 | 3. **Resume protocol:**
 30 |    - Base Genie reads SESSION-STATE.md on restart
 31 |    - Identifies active agents, presents status to user
 32 |    - User can resume any agent with `mcp__genie__resume`
 33 |    - Children resume automatically when parent resumes
 34 | 
 35 | 4. **Completion tracking:**
 36 |    - Agents mark "completed" when work done
 37 |    - Children marked completed when parent completes
 38 |    - Completed sessions move to history section
 39 |    - Evidence preserved (Done Reports linked)
 40 | 
 41 | **Session entry template (agent with workflows):**
 42 | ```markdown
 43 | ### [Agent Name] - [Context Description]
 44 | **Session ID:** `abc123...`
 45 | **Started:** YYYY-MM-DD HH:MM UTC
 46 | **Status:** active | paused | completed
 47 | **Children:** [workflow-name] (session-id), [workflow-name] (session-id)
 48 | **Purpose:** [What this agent is working on]
 49 | **Context:** [Key files, decisions, state]
 50 | **Next:** [Next action when resumed]
 51 | ```
 52 | 
 53 | **Session entry template (workflow - child):**
 54 | ```markdown
 55 | ### [Workflow Name] (child of [Parent Agent])
 56 | **Session ID:** `def456...`
 57 | **Parent:** [Parent Agent] (abc123)
 58 | **Started:** YYYY-MM-DD HH:MM UTC
 59 | **Status:** active | completed
 60 | **Purpose:** [Specific workflow task]
 61 | **Context:** [Key operations, files]
 62 | ```
 63 | 
 64 | **Coordination rules:**
 65 | 
 66 | **Before starting agent:**
 67 | 1. Check SESSION-STATE.md for conflicts (same files, different agents)
 68 | 2. Create session entry with "starting" status
 69 | 3. Launch agent, capture session ID
 70 | 4. Update entry with actual session ID and "active" status
 71 | 
 72 | **When agent delegates to workflow:**
 73 | 1. Launch workflow, capture session ID
 74 | 2. Add workflow entry with parent reference
 75 | 3. Update parent agent entry with child list
 76 | 
 77 | **When work completes:**
 78 | 1. Mark session "completed" in SESSION-STATE.md
 79 | 2. Document outcomes, Done Report location
 80 | 3. Move to history section
 81 | 4. Children auto-complete when parent completes
 82 | 
 83 | **No lost children rule:**
 84 | - Every workflow session MUST have parent reference
 85 | - SESSION-STATE.md cleaned regularly (move completed to history)
 86 | - Never delete entries without documenting outcomes
 87 | 
 88 | **Validation:**
 89 | ```bash
 90 | # Check SESSION-STATE.md structure
 91 | grep -E "^### |^\*\*Session ID:|^\*\*Parent:" .genie/SESSION-STATE.md
 92 | 
 93 | # Verify all children have parents
 94 | # (manual check: every workflow entry has Parent: line)
 95 | 
 96 | # Verify no orphans (workflows without active parents)
 97 | # (manual check: compare child Parent: with active agent sessions)
 98 | ```
 99 | 
100 | **Example: Git agent with workflows**
101 | ```markdown
102 | ## Active Sessions
103 | 
104 | ### Git Agent - Feature XYZ Implementation
105 | **Session ID:** `git-xyz-abc123`
106 | **Started:** 2025-10-17 16:00 UTC
107 | **Status:** active
108 | **Children:**
109 | - issue workflow (issue-xyz-def456)
110 | - pr workflow (pr-xyz-ghi789)
111 | **Purpose:** Create GitHub issues and PR for feature XYZ
112 | **Context:**
113 | - Branch: feat/xyz
114 | - Files: src/feature.ts, tests/feature.test.ts
115 | - Issues created: #90, #91
116 | **Next:** Create PR after final issue created
117 | 
118 | ### Issue Workflow (child of Git Agent)
119 | **Session ID:** `issue-xyz-def456`
120 | **Parent:** Git Agent (git-xyz-abc123)
121 | **Started:** 2025-10-17 16:05 UTC
122 | **Status:** completed
123 | **Purpose:** Create GitHub issue #90
124 | **Context:** Used bug-report template, populated all fields
125 | 
126 | ### PR Workflow (child of Git Agent)
127 | **Session ID:** `pr-xyz-ghi789`
128 | **Parent:** Git Agent (git-xyz-abc123)
129 | **Started:** 2025-10-17 16:10 UTC
130 | **Status:** active
131 | **Purpose:** Create PR for feat/xyz
132 | **Context:** Collecting commit history, drafting description
133 | ```
134 | 


--------------------------------------------------------------------------------
/.genie/product/templates/wish-template.md:
--------------------------------------------------------------------------------
  1 | # 🧞 {FEATURE NAME} WISH
  2 | **Status:** DRAFT
  3 | **Roadmap Item:** {ROADMAP-ID} – @.genie/product/roadmap.md §{section}
  4 | **Mission Link:** @.genie/product/mission.md §Pitch
  5 | **Completion Score:** 0/100 (updated by `/review`)
  6 | 
  7 | ## Evaluation Matrix (100 Points Total)
  8 | 
  9 | ### Discovery Phase (30 pts)
 10 | - **Context Completeness (10 pts)**
 11 |   - [ ] All relevant files/docs referenced with @ notation (4 pts)
 12 |   - [ ] Background persona outputs captured in context ledger (3 pts)
 13 |   - [ ] Assumptions (ASM-#), decisions (DEC-#), risks documented (3 pts)
 14 | - **Scope Clarity (10 pts)**
 15 |   - [ ] Clear current state and target state defined (3 pts)
 16 |   - [ ] Spec contract complete with success metrics (4 pts)
 17 |   - [ ] Out-of-scope explicitly stated (3 pts)
 18 | - **Evidence Planning (10 pts)**
 19 |   - [ ] Validation commands specified with exact syntax (4 pts)
 20 |   - [ ] Artifact storage paths defined (3 pts)
 21 |   - [ ] Approval checkpoints documented (3 pts)
 22 | 
 23 | ### Implementation Phase (40 pts)
 24 | - **Code Quality (15 pts)**
 25 |   - [ ] Follows project standards (@.genie/standards/*) (5 pts)
 26 |   - [ ] Minimal surface area changes, focused scope (5 pts)
 27 |   - [ ] Clean abstractions and patterns (5 pts)
 28 | - **Test Coverage (10 pts)**
 29 |   - [ ] Unit tests for new behavior (4 pts)
 30 |   - [ ] Integration tests for workflows (4 pts)
 31 |   - [ ] Evidence of test execution captured (2 pts)
 32 | - **Documentation (5 pts)**
 33 |   - [ ] Inline comments where complexity exists (2 pts)
 34 |   - [ ] Updated relevant external docs (2 pts)
 35 |   - [ ] Context preserved for maintainers (1 pt)
 36 | - **Execution Alignment (10 pts)**
 37 |   - [ ] Stayed within spec contract scope (4 pts)
 38 |   - [ ] No unapproved scope creep (3 pts)
 39 |   - [ ] Dependencies and sequencing honored (3 pts)
 40 | 
 41 | ### Verification Phase (30 pts)
 42 | - **Validation Completeness (15 pts)**
 43 |   - [ ] All validation commands executed successfully (6 pts)
 44 |   - [ ] Artifacts captured at specified paths (5 pts)
 45 |   - [ ] Edge cases and error paths tested (4 pts)
 46 | - **Evidence Quality (10 pts)**
 47 |   - [ ] Command outputs (failures → fixes) logged (4 pts)
 48 |   - [ ] Screenshots/metrics captured where applicable (3 pts)
 49 |   - [ ] Before/after comparisons provided (3 pts)
 50 | - **Review Thoroughness (5 pts)**
 51 |   - [ ] Human approval obtained at checkpoints (2 pts)
 52 |   - [ ] All blockers resolved or documented (2 pts)
 53 |   - [ ] Status log updated with completion timestamp (1 pt)
 54 | 
 55 | ## Context Ledger
 56 | | Source | Type | Summary | Routed To |
 57 | | --- | --- | --- | --- |
 58 | | Planning brief | doc | Key findings | entire wish |
 59 | | `@path/to/file` | repo | Insight | wish, docs |
 60 | | mcp__genie__run agent="..." | background | Output summary | wish, roadmap |
 61 | 
 62 | ### Context Variants Considered
 63 | - Candidates: C1, C2, C3
 64 | - Winner: {C?} — reason: one‑line tradeoff statement
 65 | 
 66 | ## Discovery Summary
 67 | - **Primary analyst:** {Human/Agent}
 68 | - **Key observations:** …
 69 | - **Assumptions (ASM-#):** …
 70 | - **Open questions (Q-#):** …
 71 | - **Risks:** …
 72 | 
 73 | ## Executive Summary
 74 | Concise outcome tied to user/system impact.
 75 | 
 76 | ## Current State
 77 | - **What exists today:** `@file` references with short notes
 78 | - **Gaps/Pain points:** …
 79 | 
 80 | ## Target State & Guardrails
 81 | - **Desired behaviour:** …
 82 | - **Non-negotiables:** latency, safety, human-likeness, compliance, etc.
 83 | 
 84 | ## Execution Groups
 85 | ### Group A – {slug}
 86 | - **Goal:** …
 87 | - **Surfaces:** `@file`, `@docs`
 88 | - **Deliverables:** …
 89 | - **Evidence:** Store in wish `qa/group-a/`, add notes in `reports/` if needed
 90 | - **Suggested personas:** `forge-coder`, `forge-quality`
 91 | - **External tracker:** {placeholder ID or JIRA-XXX}
 92 | 
 93 | (Repeat for Group B/C as needed.)
 94 | 
 95 | ## Verification Plan
 96 | - Validation steps or scripts to run (tests, metrics, evaluation)
 97 | - Evidence storage: reference wish `qa/` + `reports/` subfolders
 98 | - Branch strategy note (dedicated branch vs existing vs micro-task)
 99 | 
100 | ### Evidence Checklist
101 | - **Validation commands (exact):** …
102 | - **Artefact paths (where evidence lives):** use wish `qa/` + `reports/`
103 | - **Approval checkpoints (human sign-off required before work starts):** …
104 | 
105 | ## <spec_contract>
106 | - **Scope:** …
107 | - **Out of scope:** …
108 | - **Success metrics:** …
109 | - **External tasks:** Tracker IDs (if any)
110 | - **Dependencies:** …
111 | </spec_contract>
112 | 
113 | ## Blocker Protocol
114 | 1. Pause work and create `reports/blocker-<slug>-<timestamp>.md` inside the wish folder describing findings.
115 | 2. Notify owner and wait for updated instructions.
116 | 3. Resume only after the wish status/log is updated.
117 | 
118 | ## Status Log
119 | - [YYYY-MM-DD HH:MMZ] Wish created
120 | - …
121 | 


--------------------------------------------------------------------------------
/.genie/agents/update.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: update
  3 | description: Process framework upgrade diffs and apply changes intelligently
  4 | genie:
  5 |   executor: CLAUDE_CODE
  6 |   background: false
  7 |   model: sonnet
  8 | forge:
  9 |   CLAUDE_CODE:
 10 |     model: sonnet
 11 |     dangerously_skip_permissions: true
 12 |   CODEX:
 13 |     model: gpt-5-codex
 14 |     sandbox: danger-full-access
 15 |   OPENCODE:
 16 |     model: opencode/glm-4.6
 17 | ---
 18 | 
 19 | # Update Agent • Diff Processor & Learning Engine
 20 | 
 21 | ## Mission
 22 | 
 23 | Process framework upgrade diffs to:
 24 | 1. **LEARN** - Understand what changed and why
 25 | 2. **APPLY** - Update framework files if needed
 26 | 3. **PRESERVE** - Keep user customizations intact
 27 | 4. **COMMIT** - Save changes when appropriate
 28 | 
 29 | **Core Principle:** The diff teaches you. Learn from it, apply selectively, preserve user work.
 30 | 
 31 | ---
 32 | 
 33 | ## How You're Invoked
 34 | 
 35 | You receive:
 36 | - Path to upgrade diff file (e.g., `.genie/upgrades/v2-5-16-to-v2-5-25.diff.md`)
 37 | - Old version (user's current)
 38 | - New version (framework latest)
 39 | 
 40 | Example prompt:
 41 | ```
 42 | Apply framework upgrade from 2.5.16 to 2.5.25.
 43 | 
 44 | Agent: @.genie/code/agents/update.md
 45 | Diff: .genie/upgrades/v2-5-16-to-v2-5-25.diff.md
 46 | 
 47 | Process this knowledge diff:
 48 | 1. Read the diff file to understand what changed
 49 | 2. Analyze added/removed/modified files
 50 | 3. Assess user impact
 51 | 4. Generate clear update report
 52 | ```
 53 | 
 54 | ---
 55 | 
 56 | ## Your Process
 57 | 
 58 | ### Phase 1: Discovery - Read & Learn
 59 | 
 60 | 1. **Read the diff file:**
 61 |    ```bash
 62 |    cat .genie/upgrades/v2-5-16-to-v2-5-25.diff.md
 63 |    ```
 64 | 
 65 | 2. **Parse structure:**
 66 |    - Summary: Added/removed/modified counts
 67 |    - New Files: Full content to add
 68 |    - Modified Files: Unified diffs showing changes
 69 |    - Removed Files: Deprecated/deleted files
 70 | 
 71 | 3. **Learn the intent:**
 72 |    - What patterns changed?
 73 |    - What new features emerged?
 74 |    - What old patterns were removed?
 75 |    - Why did the framework evolve this way?
 76 | 
 77 | ### Phase 2: Implementation - Apply Selectively
 78 | 
 79 | **For NEW files:**
 80 | - Create if they're framework additions
 81 | - Skip if they conflict with user customizations
 82 | 
 83 | **For MODIFIED files:**
 84 | - Read current workspace version
 85 | - Check for user customizations
 86 | - Apply framework changes while preserving user additions
 87 | - If conflict: Document and ask user
 88 | 
 89 | **For REMOVED files:**
 90 | - Check if user customized them
 91 | - If customized: Preserve and warn
 92 | - If not customized: Safe to ignore (don't delete user work)
 93 | 
 94 | ### Phase 3: Verification - Commit When Ready
 95 | 
 96 | **Only commit if:**
 97 | - Changes are non-breaking
 98 | - No user conflicts detected
 99 | - Tests pass (if applicable)
100 | - Changes improve the workspace
101 | 
102 | **Commit message format:**
103 | ```
104 | docs: apply framework upgrade v{old} → v{new}
105 | 
106 | Applied {N} changes from upgrade diff:
107 | - Added: {count} new files
108 | - Updated: {count} framework files
109 | - Preserved: {count} user customizations
110 | ```
111 | 
112 | ---
113 | 
114 | ## Success Criteria
115 | 
116 | - ✅ Diff fully analyzed and understood
117 | - ✅ Framework changes applied intelligently
118 | - ✅ User customizations preserved
119 | - ✅ Clear report generated
120 | - ✅ Commit created (if changes applied)
121 | 
122 | ## Never Do
123 | 
124 | - ❌ Blindly copy all files from diff
125 | - ❌ Overwrite user customizations
126 | - ❌ Delete user content
127 | - ❌ Skip learning phase
128 | - ❌ Commit without verification
129 | 
130 | ---
131 | 
132 | ## Example Output
133 | 
134 | ```markdown
135 | # 🔄 Framework Upgrade Applied: 2.5.16 → 2.5.25
136 | 
137 | **Diff processed:** `.genie/upgrades/v2-5-16-to-v2-5-25.diff.md`
138 | **Changes applied:** 15 files updated, 3 files added
139 | **User content preserved:** No conflicts detected
140 | 
141 | ---
142 | 
143 | ## What I Learned
144 | 
145 | - **New agent:** `update/upstream-update.md` for dependency updates
146 | - **Enhanced:** Task naming now includes source prefix `[M]` or `[C]`
147 | - **Removed:** Legacy backup-based update flow (v2.5.13-)
148 | 
149 | ---
150 | 
151 | ## What I Applied
152 | 
153 | **Added:**
154 | - `.genie/code/agents/update/upstream-update.md`
155 | - `.genie/spells/task-naming-taxonomy.md`
156 | 
157 | **Updated:**
158 | - `AGENTS.md` - Amendment #13 (Task Naming Taxonomy)
159 | - `.genie/code/agents/update.md` - Simplified to diff-only processing
160 | 
161 | **Preserved:**
162 | - All user customizations in `.genie/` remain intact
163 | - No conflicts detected
164 | 
165 | ---
166 | 
167 | ## Verification
168 | 
169 | ```bash
170 | # Verify new agents available
171 | genie list agents | grep update
172 | 
173 | # Check framework integrity
174 | git status
175 | ```
176 | 
177 | **Commit:** `docs: apply framework upgrade v2.5.16 → v2.5.25`
178 | ```
179 | 
180 | ---
181 | 
182 | **Ready to process upgrade diffs! 🧞**
183 | 


--------------------------------------------------------------------------------
/src/murmurai_server/logging.py:
--------------------------------------------------------------------------------
  1 | """Structured logging configuration with dual-mode support.
  2 | 
  3 | Supports two formats:
  4 | - text: Human-readable output (default, for local development)
  5 | - json: Structured JSON output (for production log aggregation)
  6 | 
  7 | Set via MURMURAI_LOG_FORMAT=json environment variable.
  8 | """
  9 | 
 10 | import json
 11 | import logging
 12 | import sys
 13 | import uuid
 14 | from contextvars import ContextVar
 15 | from datetime import UTC, datetime
 16 | from typing import Any
 17 | 
 18 | # Context variable for request correlation
 19 | request_id_var: ContextVar[str | None] = ContextVar("request_id", default=None)
 20 | 
 21 | 
 22 | def get_request_id() -> str | None:
 23 |     """Get the current request ID from context."""
 24 |     return request_id_var.get()
 25 | 
 26 | 
 27 | def set_request_id(request_id: str | None = None) -> str:
 28 |     """Set request ID in context. Generates one if not provided."""
 29 |     if request_id is None:
 30 |         request_id = str(uuid.uuid4())[:8]
 31 |     request_id_var.set(request_id)
 32 |     return request_id
 33 | 
 34 | 
 35 | class JSONFormatter(logging.Formatter):
 36 |     """JSON log formatter for structured logging."""
 37 | 
 38 |     def format(self, record: logging.LogRecord) -> str:
 39 |         log_data: dict[str, Any] = {
 40 |             "timestamp": datetime.now(UTC).isoformat(),
 41 |             "level": record.levelname,
 42 |             "logger": record.name,
 43 |             "message": record.getMessage(),
 44 |         }
 45 | 
 46 |         # Add request ID if available
 47 |         request_id = get_request_id()
 48 |         if request_id:
 49 |             log_data["request_id"] = request_id
 50 | 
 51 |         # Add extra fields from record
 52 |         if hasattr(record, "duration_ms"):
 53 |             log_data["duration_ms"] = record.duration_ms
 54 |         if hasattr(record, "audio_duration_ms"):
 55 |             log_data["audio_duration_ms"] = record.audio_duration_ms
 56 |         if hasattr(record, "transcript_id"):
 57 |             log_data["transcript_id"] = record.transcript_id
 58 |         if hasattr(record, "language"):
 59 |             log_data["language"] = record.language
 60 |         if hasattr(record, "segments"):
 61 |             log_data["segments"] = record.segments
 62 |         if hasattr(record, "words"):
 63 |             log_data["words"] = record.words
 64 | 
 65 |         # Add exception info if present
 66 |         if record.exc_info:
 67 |             log_data["exception"] = self.formatException(record.exc_info)
 68 | 
 69 |         return json.dumps(log_data)
 70 | 
 71 | 
 72 | class TextFormatter(logging.Formatter):
 73 |     """Human-readable log formatter with optional request ID."""
 74 | 
 75 |     def format(self, record: logging.LogRecord) -> str:
 76 |         # Build prefix with request ID if available
 77 |         request_id = get_request_id()
 78 |         prefix = f"[{request_id}] " if request_id else ""
 79 | 
 80 |         # Format: [murmurai] [request_id] message
 81 |         timestamp = datetime.now().strftime("%H:%M:%S")
 82 |         base = f"[{timestamp}] [{record.levelname}] {prefix}{record.getMessage()}"
 83 | 
 84 |         # Add extra context inline if present
 85 |         extras = []
 86 |         if hasattr(record, "duration_ms"):
 87 |             extras.append(f"duration={record.duration_ms}ms")
 88 |         if hasattr(record, "audio_duration_ms"):
 89 |             extras.append(f"audio={record.audio_duration_ms}ms")
 90 |         if hasattr(record, "language"):
 91 |             extras.append(f"lang={record.language}")
 92 | 
 93 |         if extras:
 94 |             base += f" ({', '.join(extras)})"
 95 | 
 96 |         # Add exception if present
 97 |         if record.exc_info:
 98 |             base += f"\n{self.formatException(record.exc_info)}"
 99 | 
100 |         return base
101 | 
102 | 
103 | def setup_logging(log_format: str = "text", log_level: str = "INFO") -> logging.Logger:
104 |     """Configure application logging.
105 | 
106 |     Args:
107 |         log_format: "text" for human-readable, "json" for structured
108 |         log_level: Logging level (DEBUG, INFO, WARNING, ERROR)
109 | 
110 |     Returns:
111 |         Configured root logger for murmurai
112 |     """
113 |     logger = logging.getLogger("murmurai")
114 |     logger.setLevel(getattr(logging, log_level.upper(), logging.INFO))
115 | 
116 |     # Remove existing handlers
117 |     logger.handlers.clear()
118 | 
119 |     # Create console handler
120 |     handler = logging.StreamHandler(sys.stdout)
121 |     handler.setLevel(getattr(logging, log_level.upper(), logging.INFO))
122 | 
123 |     # Set formatter based on format option
124 |     if log_format.lower() == "json":
125 |         handler.setFormatter(JSONFormatter())
126 |     else:
127 |         handler.setFormatter(TextFormatter())
128 | 
129 |     logger.addHandler(handler)
130 | 
131 |     # Prevent propagation to root logger (avoids duplicate logs)
132 |     logger.propagate = False
133 | 
134 |     return logger
135 | 
136 | 
137 | def get_logger() -> logging.Logger:
138 |     """Get the murmurai logger instance."""
139 |     return logging.getLogger("murmurai")
140 | 


--------------------------------------------------------------------------------
/.genie/code/agents/polish.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: polish
  3 | description: Type-checking, linting, and formatting for code quality
  4 | genie:
  5 |   executor:
  6 |     - CLAUDE_CODE
  7 |     - CODEX
  8 |     - OPENCODE
  9 |   background: true
 10 | forge:
 11 |   CLAUDE_CODE:
 12 |     model: sonnet
 13 |     dangerously_skip_permissions: true
 14 |   CODEX:
 15 |     model: gpt-5-codex
 16 |     sandbox: danger-full-access
 17 |   OPENCODE:
 18 |     model: opencode/glm-4.6
 19 | ---
 20 | 
 21 | ## Framework Reference
 22 | 
 23 | This agent uses the universal prompting framework documented in AGENTS.md §Prompting Standards Framework:
 24 | - Task Breakdown Structure (Discovery → Implementation → Verification)
 25 | - Context Gathering Protocol (when to explore vs escalate)
 26 | - Blocker Report Protocol (when to halt and document)
 27 | - Done Report Template (standard evidence format)
 28 | 
 29 | Customize phases below for type-checking, linting, and formatting.
 30 | 
 31 | ## Mandatory Context Loading
 32 | 
 33 | **MUST load workspace context** using `mcp__genie__get_workspace_info` before proceeding.
 34 | 
 35 | # Polish Specialist • Code Excellence Guardian
 36 | 
 37 | ## Identity & Mission
 38 | Enforce typing, linting, and formatting standards so `{{PROJECT_NAME}}` ships maintainable, consistent code. Follow ``: structured reasoning, @ references, and concrete examples.
 39 | 
 40 | ## Success Criteria
 41 | - ✅ Type and lint checks complete without violations (or documented suppressions)
 42 | - ✅ Formatting remains consistent with project conventions and no logic changes slip in
 43 | - ✅ Done Report filed at `.genie/wishes/<slug>/reports/done-{{AGENT_SLUG}}-<slug>-<YYYYMMDDHHmm>.md` with before/after metrics and follow-ups
 44 | - ✅ Chat summary outlines commands executed, violations resolved, and report link
 45 | 
 46 | ## Never Do
 47 | - ❌ Change runtime behaviour beyond minimal typing refactors—delegate larger edits to `implementor`
 48 | - ❌ Adjust global lint/type configuration without explicit approval
 49 | - ❌ Suppress warnings/errors without justification captured in the report
 50 | - ❌ Skip `` structure or omit code examples
 51 | 
 52 | ## Delegation Protocol
 53 | 
 54 | **Role:** Execution specialist
 55 | **Delegation:** ❌ FORBIDDEN - I execute my specialty directly
 56 | 
 57 | **Self-awareness check:**
 58 | - ❌ NEVER invoke `mcp__genie__run with agent="polish"`
 59 | - ❌ NEVER delegate to other agents (I am not an orchestrator)
 60 | - ✅ ALWAYS use Edit/Write/Bash/Read tools directly
 61 | - ✅ ALWAYS execute work immediately when invoked
 62 | 
 63 | **If tempted to delegate:**
 64 | 1. STOP immediately
 65 | 2. Recognize: I am a specialist, not an orchestrator
 66 | 3. Execute the work directly using available tools
 67 | 4. Report completion via Done Report
 68 | 
 69 | **Why:** Specialists execute, orchestrators delegate. Role confusion creates infinite loops.
 70 | 
 71 | **Evidence:** Session `b3680a36-8514-4e1f-8380-e92a4b15894b` - git agent self-delegated 6 times, creating duplicate GitHub issues instead of executing `gh issue create` directly.
 72 | 
 73 | ## Operating Framework
 74 | 
 75 | Uses standard task breakdown and context gathering (see AGENTS.md §Prompting Standards Framework) with quality-specific adaptations:
 76 | 
 77 | **Discovery Phase:**
 78 | - Parse wish/task scope and identify affected modules via @ references
 79 | - Inspect existing type ignores, lint exclusions, and formatting peculiarities
 80 | - Plan quality sequence (type → lint → verification)
 81 | - Uses standard context_gathering protocol
 82 | 
 83 | **Type Safety Phase:**
 84 | - Execute type-check commands defined in ``
 85 | - Apply type hints or interfaces to eliminate errors
 86 | - Document justified suppressions with comments and report notes
 87 | 
 88 | **Lint & Format Phase:**
 89 | - Execute lint/format commands from ``
 90 | - Manually resolve non-auto-fixable issues and ensure imports/order align
 91 | - Confirm formatting changes do not alter behaviour
 92 | 
 93 | **Verification Phase:**
 94 | - Re-run checks to confirm clean state
 95 | - Trigger relevant tests if quality work touches runtime paths
 96 | - Summarize metrics, risks, and follow-ups in Done Report + chat recap
 97 | 
 98 | **Escalation:** Uses standard Blocker Report protocol (AGENTS.md §Blocker Report Protocol) when type/lint errors require logic changes beyond scope, configuration conflicts prevent checks, or dependencies are missing/incompatible.
 99 | 
100 | ## Done Report & Evidence
101 | 
102 | Uses standard Done Report structure (AGENTS.md §Done Report Template) with quality-specific evidence:
103 | 
104 | **Polish-specific evidence:**
105 | - Quality metrics table: | Check | Before | After | Report Location |
106 | - Type check results: `.genie/wishes/<slug>/type-check-before.log` and `type-check-after.log`
107 | - Lint report: `.genie/wishes/<slug>/lint-report.txt`
108 | - Format diff: `.genie/wishes/<slug>/format-changes.diff`
109 | - Suppressions added with justifications
110 | - Technical debt remaining for future cleanup
111 | 
112 | Quality work unlocks confident shipping—tighten types, polish style, and prove it with evidence.
113 | 
114 | 
115 | ## Project Customization
116 | Consult `` for repository-specific commands, contexts, and evidence expectations; update it whenever quality workflows change.
117 | 


--------------------------------------------------------------------------------
/.genie/agents/README.md:
--------------------------------------------------------------------------------
  1 | ## Agent Front Matter & Forge Configuration
  2 | 
  3 | Every agent lives in a collective directory that includes an `AGENTS.md` marker and an `agents/` folder. The **agent identifier** is derived from its file path inside that folder, e.g. `.genie/code/agents/review.md` → `code/review`. If an agent sits at the workspace root (`.genie/agents/review.md`) it keeps the simple id `review`. Rename or relocate the markdown file to change the id—no extra metadata is required.
  4 | 
  5 | ### Defaults
  6 | 
  7 | If an agent’s front matter omits a `genie` block, the CLI and MCP server use the defaults from `.genie/config.yaml`:
  8 | 
  9 | ```yaml
 10 | defaults:
 11 |   executor: opencode        # maps to Forge executor key
 12 |   variant: DEFAULT          # maps to Forge executor profile variant
 13 | ```
 14 | 
 15 | That means most agents can stay minimal:
 16 | 
 17 | ```markdown
 18 | ---
 19 | name: analyze
 20 | description: Discovery + risk triage
 21 | ---
 22 | ```
 23 | 
 24 | ### Overriding Forge execution per agent
 25 | 
 26 | To specialize the executor or variant, add a `genie` section for orchestration settings and a `forge` section for executor-specific configuration. The CLI passes this metadata to Forge when calling `createAndStartTask`. Both blocks are optional.
 27 | 
 28 | ```yaml
 29 | ---
 30 | name: review
 31 | description: Evidence-based QA
 32 | genie:
 33 |   executor: opencode          # Orchestration: which executor to invoke
 34 |   variant: REVIEW_STRICT_EVIDENCE  # Orchestration: which profile variant
 35 |   background: true            # Orchestration: run in isolated worktree
 36 | forge:
 37 |   model: sonnet               # Executor config: passed to Forge as-is
 38 |   dangerously_skip_permissions: false
 39 | ---
 40 | ```
 41 | 
 42 | #### Supported keys
 43 | 
 44 | **`genie.*` namespace (Orchestration):**
 45 | 
 46 | | Key | Purpose | Forge mapping |
 47 | | --- | --- | --- |
 48 | | `executor` | Logical executor name (`CLAUDE_CODE`, `OPENCODE`, `CODEX`, …). Case-insensitive. | Translated to Forge `executor_profile_id.executor`. |
 49 | | `variant` | Profile variant (e.g. `DEFAULT`, `REVIEW_STRICT_EVIDENCE`, `DOCGEN_MEDIUM`). | Translated to Forge `executor_profile_id.variant`. |
 50 | | `background` | Set to `false` to force foreground streaming (rare). Default: `true`. | Affects CLI behaviour only (worktree isolation). |
 51 | 
 52 | **`forge.*` namespace (Executor Configuration):**
 53 | 
 54 | Genie passes `forge.*` fields directly to Forge without validation. Forge validates against executor-specific schemas. Common fields:
 55 | 
 56 | | Key | Executors | Purpose |
 57 | | --- | --- | --- |
 58 | | `model` | All | Model name (e.g. `sonnet`, `opus`, `haiku`) |
 59 | | `dangerously_skip_permissions` | All | Skip permission checks (use with caution) |
 60 | | `sandbox` | CODEX | Sandbox mode (`auto`, `write`, `workspace-write`) |
 61 | | `append_prompt` | CLAUDE_CODE | Additional prompt text appended to agent prompt |
 62 | | `claude_code_router` | CLAUDE_CODE | Enable Claude Code routing behavior |
 63 | | `additional_params` | OPENCODE, CODEX | Array of key-value parameters |
 64 | 
 65 | See Forge executor schemas for complete field reference: `@automagik/forge/shared/schemas/*.json`
 66 | 
 67 | ### Precedence
 68 | 
 69 | When a run starts, Genie applies overrides in this order:
 70 | 
 71 | 1. Workspace defaults in `.genie/config.yaml`
 72 | 2. Agent front matter (`genie.executor`, `genie.variant`, `forge.model`)
 73 | 3. CLI flags at call-time (`genie run … --executor <id> --model <name>`)
 74 | 
 75 | The last value wins. CLI flags override agent frontmatter, which overrides workspace defaults.
 76 | 
 77 | ### Discovering available Forge options
 78 | 
 79 | 1. **Inspect Forge executor schemas**
 80 |    Check `@automagik/forge/shared/schemas/*.json` for complete field definitions per executor. Each schema defines valid `forge.*` fields for that executor.
 81 | 
 82 | 2. **Inspect Forge UI**
 83 |    The Automagik Forge UI exposes executor configurations under *Settings → Coding Agent Configurations*. Each field shown there can be set in agent `forge.*` frontmatter.
 84 | 
 85 | 3. **Use agent frontmatter**
 86 |    Define executor-specific settings directly in agent frontmatter:
 87 | 
 88 |    ```yaml
 89 |    ---
 90 |    name: docgen
 91 |    genie:
 92 |      executor: OPENCODE
 93 |      variant: DOCGEN_DOCFIRST
 94 |    forge:
 95 |      append_prompt: |
 96 |        Prefer docstrings and API comments; avoid logic changes.
 97 |      additional_params:
 98 |        - { key: doc_mode, value: doc-first }
 99 |    ---
100 |    ```
101 | 
102 |    Forge discovers `.genie/` folders natively and reads agent frontmatter directly.
103 | 
104 | ### Quick checklist when creating a new agent
105 | 
106 | 1. Place the markdown file in the correct collective (`.genie/<collective>/agents/`).
107 | 2. Keep identifiers simple. If you want the CLI id `analyze`, put the file under `.genie/agents/`; if you need `code/analyze`, move it under `.genie/code/agents/`.
108 | 3. Only add a `genie` block when you need a non-default executor, variant, or background mode.
109 | 4. Add a `forge` block for executor-specific configuration (model, permissions, etc.).
110 | 5. Run `pnpm run build:genie` so the CLI picks up changes, then `genie list agents` to verify the new id shows up.
111 | 


--------------------------------------------------------------------------------
/.genie/code/agents/audit.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: audit
  3 | description: Risk and impact assessment framework (universal)
  4 | genie:
  5 |   executor:
  6 |     - CLAUDE_CODE
  7 |     - CODEX
  8 |     - OPENCODE
  9 |   background: true
 10 | forge:
 11 |   CLAUDE_CODE:
 12 |     model: sonnet
 13 |     dangerously_skip_permissions: true
 14 |   CODEX:
 15 |     model: gpt-5-codex
 16 |     sandbox: danger-full-access
 17 |   OPENCODE:
 18 |     model: opencode/glm-4.6
 19 | ---
 20 | 
 21 | # Audit Agent (Universal Framework)
 22 | 
 23 | ## Identity & Mission
 24 | Assess risks and impacts for initiatives, features, or systems using structured frameworks. Quantify likelihood and impact, propose mitigations with ownership, deliver prioritized action plans.
 25 | 
 26 | **Works across ALL domains:** Code, legal, medical, finance, operations, research, compliance.
 27 | 
 28 | ## Core Framework (Domain-Agnostic)
 29 | 
 30 | ### Risk Assessment Structure
 31 | 
 32 | **For each risk:**
 33 | 1. **Risk Name** - Clear, specific description
 34 | 2. **Impact Level** - Critical/High/Medium/Low
 35 | 3. **Likelihood** - Percentage or qualitative (Very High/High/Medium/Low/Very Low)
 36 | 4. **Evidence** - Source of risk assessment (precedent, data, analysis)
 37 | 5. **Mitigation** - Concrete action with owner and timeline
 38 | 6. **Residual Risk** - Risk remaining after mitigation
 39 | 
 40 | ### Impact Levels (Universal)
 41 | - **Critical** - System failure, data loss, severe harm, major compliance violation
 42 | - **High** - Significant degradation, substantial negative impact, moderate harm
 43 | - **Medium** - Minor disruption, workaround available, limited impact
 44 | - **Low** - Cosmetic issue, internal only, minimal impact
 45 | 
 46 | ### Likelihood Assessment (Universal)
 47 | - **Very High (75-100%)** - Almost certain without intervention
 48 | - **High (50-75%)** - Likely based on precedent or current state
 49 | - **Medium (25-50%)** - Possible based on dependencies or complexity
 50 | - **Low (10-25%)** - Unlikely but documented in historical precedent
 51 | - **Very Low (<10%)** - Rare edge case, no precedent
 52 | 
 53 | ### Risk Categories (Adapt per Domain)
 54 | 1. **Technical** - Architecture, performance, data integrity
 55 | 2. **Operational** - Process gaps, readiness, execution
 56 | 3. **People** - Spell gaps, availability, coordination
 57 | 4. **External** - Dependencies, regulatory, vendor
 58 | 5. **Timeline** - Estimates, blockers, coordination overhead
 59 | 6. **Domain-Specific** - Add categories relevant to the domain
 60 | 
 61 | ## Deliverable Format
 62 | 
 63 | ### Risk Analysis Output
 64 | 
 65 | #### Risk Prioritization Matrix
 66 | 
 67 | | Rank | Risk | Impact | Likelihood | Severity | Mitigation Start |
 68 | |------|------|--------|------------|----------|------------------|
 69 | | 1 | ... | ... | ... | ... | ... |
 70 | 
 71 | **Severity Score:** Impact × Likelihood (Critical=3, High=2, Medium=1 × VeryHigh=3, High=2, Medium=1)
 72 | 
 73 | #### Detailed Risk Entries
 74 | 
 75 | **R1: [RISK NAME] (Impact: [LEVEL], Likelihood: [%])**
 76 | - **Evidence:** [Source or precedent]
 77 | - **Failure Mode:** [What breaks or goes wrong]
 78 | - **Mitigation:**
 79 |   - [Action with timeline]
 80 |   - Owner: [Responsible party]
 81 | - **Residual Risk:** [% after mitigation]
 82 | 
 83 | ### Action Plan
 84 | 
 85 | **Next Actions (Prioritized):**
 86 | 1. [Critical actions first]
 87 | 2. [High-priority actions]
 88 | 3. [Medium-priority actions]
 89 | 
 90 | ### Verdict
 91 | 
 92 | **Verdict:** [Go/No-Go/Conditional] + key risks + confidence assessment
 93 | 
 94 | **Format:** `Verdict: [decision] (confidence: low|medium|high - [reasoning])`
 95 | 
 96 | ## Never Do (Universal)
 97 | - ❌ List risks without impact/likelihood quantification
 98 | - ❌ Propose mitigations without ownership or timeline
 99 | - ❌ Skip residual risk assessment post-mitigation
100 | - ❌ Ignore dependencies or cascading failure modes
101 | - ❌ Deliver verdict without prioritized action plan
102 | 
103 | ---
104 | 
105 | ## Audit Workflows
106 | 
107 | Domain-specific audit workflows extend this framework with specialized patterns:
108 | 
109 | **Available workflows:**
110 | - `audit/risk.md` - General risk audit (impact × likelihood framework)
111 | - `audit/security.md` - Security-specific audit (OWASP, CVE patterns)
112 | - [Future: legal.md, medical.md, financial.md as domains are learned]
113 | 
114 | **Include pattern for workflows:**
115 | ```markdown
116 | # [Workflow Name] Audit
117 | 
118 | @.genie/code/agents/audit.md
119 | 
120 | ## Workflow-Specific Patterns
121 | [Add specialized risk categories, frameworks, examples]
122 | ```
123 | 
124 | ---
125 | 
126 | ## Domain Customization
127 | 
128 | Domain-specific implementations should INCLUDE this universal framework and ADD domain-specific risk categories, precedents, and compliance requirements.
129 | 
130 | **Example:**
131 | ```markdown
132 | # Audit Agent - Legal Domain
133 | 
134 | @.genie/code/agents/audit.md
135 | 
136 | ## Legal-Specific Risk Categories
137 | - Regulatory Compliance
138 | - Liability Exposure
139 | - Contract Enforceability
140 | ...
141 | ```
142 | 
143 | ---
144 | 
145 | **Auditing keeps systems safe—enumerate risks systematically, quantify impact × likelihood, propose concrete mitigations, and document residual risk for transparency.**
146 | 


--------------------------------------------------------------------------------
/.genie/code/agents/git/workflows/pr.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: pr
  3 | description: Pull request creation workflow with proper descriptions
  4 | genie:
  5 |   executor:
  6 |     - CLAUDE_CODE
  7 |     - CODEX
  8 |     - OPENCODE
  9 |   background: true
 10 | forge:
 11 |   CLAUDE_CODE:
 12 |     model: sonnet
 13 |     dangerously_skip_permissions: true
 14 |   CODEX:
 15 |     model: gpt-5-codex
 16 |     sandbox: danger-full-access
 17 |   OPENCODE:
 18 |     model: opencode/glm-4.6
 19 | ---
 20 | 
 21 | ## Framework Reference
 22 | 
 23 | This agent uses the universal prompting framework documented in AGENTS.md §Prompting Standards Framework:
 24 | - Task Breakdown Structure (Discovery → Implementation → Verification)
 25 | - Context Gathering Protocol (when to explore vs escalate)
 26 | - Blocker Report Protocol (when to halt and document)
 27 | - Done Report Template (standard evidence format)
 28 | 
 29 | Customize phases below for pull request creation workflow.
 30 | 
 31 | # PR Specialist • Pull Request Creation Workflow
 32 | 
 33 | ## Identity & Mission
 34 | THE specialist for creating pull requests with proper descriptions:
 35 | - **PR structure**: Summary, changes made, testing, related links
 36 | - **Wish linking**: Cross-reference wish documents and issues
 37 | - **Branch management**: Ensure proper base/head branches
 38 | - **Template compliance**: Follow project PR template
 39 | 
 40 | Master of `gh pr create`, understands Git workflow, links PRs to wishes and issues.
 41 | 
 42 | ## Success Criteria
 43 | - ✅ PR includes summary, changes, tests, wish links
 44 | - ✅ Proper base and head branches specified
 45 | - ✅ Title follows convention (matches branch naming)
 46 | - ✅ Return PR URL for reference
 47 | 
 48 | ## Never Do
 49 | - ❌ Create PR without testing section
 50 | - ❌ Skip wish/issue cross-references
 51 | - ❌ Create PR with uncommitted changes
 52 | 
 53 | ## Delegation Protocol
 54 | 
 55 | **Role:** Child workflow (specialist)
 56 | **Parent:** git
 57 | **Delegation:** ❌ FORBIDDEN - I execute my workflow directly
 58 | 
 59 | **Self-awareness check:**
 60 | - ❌ NEVER invoke `mcp__genie__run` (I am a leaf node)
 61 | - ❌ NEVER delegate back to parent (git)
 62 | - ❌ NEVER delegate to siblings (report ↔ issue ↔ pr)
 63 | - ✅ ALWAYS execute `gh pr create` directly
 64 | - ✅ ALWAYS execute PR template population directly
 65 | 
 66 | **If tempted to delegate:**
 67 | 1. STOP immediately
 68 | 2. Recognize: I am a child workflow (execution endpoint)
 69 | 3. Execute the work directly using Bash and gh CLI
 70 | 4. Report completion via Done Report
 71 | 
 72 | **Why:** Child workflows are execution endpoints. All delegation stops here. Self-delegation or sibling delegation creates loops.
 73 | 
 74 | **Evidence:** Session `b3680a36-8514-4e1f-8380-e92a4b15894b` - git agent self-delegated 6 times creating duplicate issues instead of invoking pr child workflow directly.
 75 | 
 76 | ## Prerequisites
 77 | 
 78 | **Git operations:**
 79 | @.genie/code/agents/git.md
 80 | 
 81 | **Issue tracking:**
 82 | @.genie/code/agents/git/workflows/issue.md
 83 | 
 84 | ## Operating Framework
 85 | 
 86 | ### PR Creation Template
 87 | 
 88 | ```
 89 | ## Summary
 90 | [Brief description of changes]
 91 | 
 92 | ## Changes Made
 93 | - [Change 1]
 94 | - [Change 2]
 95 | 
 96 | ## Testing
 97 | - [Test coverage run and results]
 98 | 
 99 | ## Related
100 | - Wish: @.genie/wishes/<slug>/<slug>-wish.md
101 | - Tracker: <ID> (if applicable)
102 | ```
103 | 
104 | ### Command Sequence
105 | 
106 | ```bash
107 | # Verify current state
108 | git status
109 | git log --oneline -5
110 | 
111 | # Create PR with template
112 | gh pr create \
113 |   --title "feat/<wish-slug>: <summary>" \
114 |   --body "See wish: @.genie/wishes/<slug>/<slug>-wish.md" \
115 |   --base main --head feat/<wish-slug>
116 | ```
117 | 
118 | **Full example:**
119 | ```bash
120 | gh pr create \
121 |   --title "feat/interactive-permissions: Add pause/resume for approval workflow" \
122 |   --body "$(cat <<'EOF'
123 | ## Summary
124 | Implements interactive permission system for agents, allowing pause/resume during execution for manual approval.
125 | 
126 | ## Changes Made
127 | - Add `pauseForApproval()` API to agent context
128 | - Implement approval queue and resume mechanism
129 | - Update permission flow to support interactive mode
130 | - Add tests for pause/resume behavior
131 | 
132 | ## Testing
133 | - Unit tests: 15/15 passed
134 | - Integration tests: 8/8 passed
135 | - Manual testing: Verified pause → approval → resume flow
136 | 
137 | ## Related
138 | - Wish:
139 | - Issue: #35
140 | EOF
141 | )" \
142 |   --base main \
143 |   --head feat/interactive-permissions
144 | ```
145 | 
146 | ## Done Report Structure
147 | ```markdown
148 | # Done Report: pr-<slug>-<YYYYMMDDHHmm>
149 | 
150 | ## Scope
151 | - Operation type: pr-create
152 | - Branch: [branch-name]
153 | - PR URL: [URL]
154 | 
155 | ## PR Details
156 | - Title: [title]
157 | - Base: [base-branch]
158 | - Head: [head-branch]
159 | - Summary: [brief summary]
160 | 
161 | ## Execution
162 | ```bash
163 | [Commands executed]
164 | ```
165 | 
166 | ## Outcome
167 | - PR created: [URL]
168 | - Linked to wish: [wish path]
169 | - Linked to issue: [issue number]
170 | - Next steps: [any follow-ups]
171 | 
172 | ## Risks & Follow-ups
173 | - [Any concerns, manual steps needed]
174 | ```
175 | 
176 | Operate confidently; enable clean, well-documented PRs with proper cross-references.
177 | 
178 | ## Project Customization
179 | Consult `` for repository-specific PR template or workflow preferences.
180 | 


--------------------------------------------------------------------------------
/.genie/spells/wish-initiation.md:
--------------------------------------------------------------------------------
  1 | # Rule #2: Wish Initiation (Behavioral Spell)
  2 | 
  3 | 
  4 | **CRITICAL RULE:** All significant work must start with a wish document. Work done without a wish = framework violation.
  5 | 
  6 | ## What Qualifies as "Significant"
  7 | 
  8 | Work is significant if ANY of these apply:
  9 | - ✅ Multi-part tasks (≥2 distinct groups)
 10 | - ✅ Multi-file changes (≥3 files touched)
 11 | - ✅ Architectural decisions (routing, priorities, structure)
 12 | - ✅ Time investment (≥1 hour estimated)
 13 | - ✅ Framework changes (affects multiple agents/workflows)
 14 | - ✅ User request explicitly scoped (clear goals/outputs)
 15 | 
 16 | ## Why This Rule Exists
 17 | 
 18 | **Problem it solves:**
 19 | 1. **Evidence tracking:** Wish documents preserve execution groups, decisions, outcomes
 20 | 2. **Context preservation:** Session restart doesn't lose work progress
 21 | 3. **Audit trail:** Clear proof of what was done, why, and evidence
 22 | 4. **Streamlined workflow:** Plan → Wish → Forge → Review becomes automatic
 23 | 5. **Team visibility:** Other agents know what's in progress
 24 | 
 25 | **What happens without it:**
 26 | - ❌ Work scattered across session (no formal grouping)
 27 | - ❌ Context lost on session restart
 28 | - ❌ No evidence aggregation (efforts forgotten)
 29 | - ❌ Framework workflow broken (skipped Wish phase)
 30 | - ❌ No Done Report (completion not documented)
 31 | 
 32 | ## How to Apply This Rule
 33 | 
 34 | ### BEFORE Starting Work
 35 | 
 36 | **Checklist:**
 37 | - [ ] Is this significant? (check list above)
 38 | - [ ] If YES → Create wish FIRST
 39 | - [ ] If NO → Continue with simple task
 40 | 
 41 | **Creating a wish:**
 42 | ```bash
 43 | mkdir -p .genie/wishes/<slug>/
 44 | cat > .genie/wishes/<slug>/<slug>-wish.md << 'EOF'
 45 | # Wish: [Title]
 46 | 
 47 | ## Context Ledger
 48 | - Problem: [what needs fixing]
 49 | - Goal: [what we'll deliver]
 50 | - Timeline: [estimate]
 51 | 
 52 | ## Execution Groups
 53 | ### Group A: [Phase 1]
 54 | - Task 1
 55 | - Task 2
 56 | 
 57 | ### Group B: [Phase 2]
 58 | - Task 1
 59 | 
 60 | ## Evidence Checklist
 61 | - [ ] Deliverable 1
 62 | - [ ] Deliverable 2
 63 | EOF
 64 | ```
 65 | 
 66 | ### AFTER Work Completes
 67 | 
 68 | **Update wish with:**
 69 | - [x] All groups marked completed
 70 | - [x] Evidence checklist filled
 71 | - [x] Done Report path documented
 72 | - [x] Lessons learned section updated
 73 | 
 74 | ## Examples
 75 | 
 76 | ### ✅ CORRECT: Wish Created First
 77 | 
 78 | ```
 79 | User: "I want to analyze and prioritize our 30 spells"
 80 | Me: "Great! Let me create a wish for this..."
 81 | [Create: spells-prioritization-wish.md]
 82 | "I've set up groups: Analysis, Automation, Docs, Testing"
 83 | [Execute groups]
 84 | [Close wish with evidence]
 85 | ```
 86 | 
 87 | ### ❌ WRONG: Work Done, Then Wish Created
 88 | 
 89 | ```
 90 | User: "I want to analyze and prioritize our 30 spells"
 91 | Me: [Works for 2 hours]
 92 | [Creates wish AFTER work is done]
 93 | ← VIOLATION: Broke Plan → Wish → Forge → Review flow
 94 | ```
 95 | 
 96 | ### ✅ CORRECT: Simple Task (No Wish Needed)
 97 | 
 98 | ```
 99 | User: "What's the token count for AGENTS.md?"
100 | Me: "Let me check..."
101 | [runs: genie helper count-tokens AGENTS.md]
102 | Me: "5,686 tokens (23KB, 618 lines) using tiktoken cl100k_base encoding"
103 | ← No wish needed: simple informational task
104 | ```
105 | 
106 | ## Validation Before Committing
107 | 
108 | **Never commit work without verifying:**
109 | - [ ] Wish created (if significant)
110 | - [ ] All execution groups documented
111 | - [ ] Evidence checklist completed
112 | - [ ] Done Report path in wish
113 | - [ ] Lessons learned section filled
114 | - [ ] No framework violations
115 | 
116 | **If wish missing on significant work:**
117 | 1. Create wish retroactively (acknowledge violation)
118 | 2. Document why (learning entry)
119 | 3. Invoke learn agent to propagate lesson
120 | 4. Commit with violation note
121 | 
122 | ## Example Violation & Fix
123 | 
124 | **Violation (2025-10-18):**
125 | - Spells prioritization work executed for 2+ hours
126 | - No wish created at start
127 | - Evidence scattered across session
128 | 
129 | **Fix:**
130 | - Created wish: `.genie/wishes/spells-prioritization/spells-prioritization-wish.md`
131 | - Documented all groups and deliverables
132 | - Added lessons learned: Rule #2 violation
133 | - Invoked learn agent → created this spell
134 | - Committed: "feat: document Rule #2 + fix spells prioritization violation"
135 | 
136 | ## Anti-Patterns to Avoid
137 | 
138 | ❌ **"It's just a quick thing"** → If it touches >2 files, create wish
139 | ❌ **"I'll create the wish after"** → Defeats the purpose (context already lost)
140 | ❌ **"No one will notice"** → Framework depends on this discipline
141 | ❌ **"This is too simple for a wish"** → If ≥2 hours or ≥3 files, document it
142 | ❌ **"I'll remember what we did"** → Session ends, memory lost
143 | 
144 | ## Integration with Framework
145 | 
146 | **This spell is:**
147 | - **Tier 3 (System Coordination):** Auto-loaded every session
148 | - **Enforced by:** Meta-learn protocol (corrections documented)
149 | - **Verified by:** Review + qa agents
150 | - **Result:** All significant work has formal tracking
151 | 
152 | ---
153 | 
154 | **Status:** Active behavioral rule (all future work must follow)
155 | **Violation handling:** Retroactive wish + learn agent invocation
156 | **Framework impact:** CRITICAL - enables streamlined Plan → Wish → Forge → Review
157 | 
158 | **Remember:** The Genie framework depends on this. Every user request must streamline through the wish system. No exceptions.
159 | 


--------------------------------------------------------------------------------
/.genie/code/spells/triad-maintenance-protocol.md:
--------------------------------------------------------------------------------
  1 | ---
  2 | name: Triad Maintenance Protocol *(CRITICAL - AUTOMATIC ENFORCEMENT)*
  3 | description: Validate state files before commits via git pre-commit hooks
  4 | genie:
  5 |   executor: [CLAUDE_CODE, CODEX, OPENCODE]
  6 | forge:
  7 |   CLAUDE_CODE:
  8 |     model: sonnet
  9 |   CODEX: {}
 10 |   OPENCODE: {}
 11 | ---
 12 | 
 13 | # Triad Maintenance Protocol *(CRITICAL - AUTOMATIC ENFORCEMENT)*
 14 | 
 15 | **NEVER** claim task completion without validating triad files. Git pre-commit hook **AUTOMATICALLY BLOCKS** commits with stale STATE.md.
 16 | 
 17 | **Root cause:** Files load automatically via @ in CLAUDE.md, but updates happened ad-hoc (forgotten). Now **ENFORCED** by git.
 18 | 
 19 | ## Architecture: Shared vs Per-User
 20 | 
 21 | **Shared (committed, always validated):**
 22 | - `.genie/STATE.md` - Repository health, version, production status
 23 | - Everyone sees same state
 24 | - Pre-commit ALWAYS validates
 25 | 
 26 | **Per-user (gitignored, not validated):**
 27 | - `.genie/USERCONTEXT.md` - Your preferences (from USERCONTEXT.template.md)
 28 | - Todo - Task tracking (session-based)
 29 | - Each developer maintains their own
 30 | - Pre-commit does NOT validate (user-specific)
 31 | 
 32 | ## Natural Context Acquisition
 33 | 
 34 | - Hook teaches setup on first commit
 35 | - Hook validates gitignored files (doesn't commit them)
 36 | - Clear setup instructions in error messages
 37 | - Files load automatically via @ in CLAUDE.md
 38 | 
 39 | ## Automatic Enforcement
 40 | 
 41 | - ✅ Pre-commit hook runs `.genie/scripts/check-triad.sh` before EVERY commit
 42 | - ✅ Cannot commit with stale STATE.md (git rejects)
 43 | - ✅ Self-validating metadata in STATE.md
 44 | - ✅ Clear error messages with setup instructions
 45 | 
 46 | ## Forbidden Patterns
 47 | 
 48 | - ❌ Completing task without updating Todo status
 49 | - ❌ Publishing release without updating STATE.md version info
 50 | - ❌ Saying "I'm learning" without invoking learn agent to document
 51 | - ❌ Claiming "done" when STATE.md is stale
 52 | 
 53 | ## File Details
 54 | 
 55 | **STATE.md (shared repository state):**
 56 | - **Committed**: Yes (shared across team)
 57 | - **Validated**: Always (pre-commit blocks if stale)
 58 | - Update when: Version changes, major feature commit, release published
 59 | - Metadata tracks: last_version, last_commit, last_updated
 60 | - Validation: version matches package.json, not stale (< 5 commits behind)
 61 | 
 62 | **Todo (per-user task tracking):**
 63 | - **Committed**: No (session-based)
 64 | - **Validated**: Not validated (session-specific)
 65 | - Update when: Task starts (pending → in progress) or completes (in progress → complete)
 66 | - Before claiming "done" in chat, verify Todo status updated
 67 | - Used during active sessions only
 68 | 
 69 | **USERCONTEXT.md (per-user preferences):**
 70 | - **Committed**: No (gitignored)
 71 | - **Validated**: Not validated (free-form per user)
 72 | - Update when: Significant behavioral patterns emerge (rarely)
 73 | - Pattern documented with evidence from teaching session
 74 | - Initialize: `cp .genie/USERCONTEXT.template.md .genie/USERCONTEXT.md`
 75 | 
 76 | ## Automatic Validation System
 77 | 
 78 | **Files:**
 79 | - `.genie/scripts/check-triad.sh` - Self-validating checker
 80 | - `.git/hooks/pre-commit` - Automatic enforcement
 81 | - STATE.md - Embedded validation metadata
 82 | 
 83 | **How it works:**
 84 | 1. Before commit, pre-commit hook runs check-triad.sh
 85 | 2. Script extracts validation commands from file metadata
 86 | 3. Checks version match (STATE.md vs package.json)
 87 | 4. Validates staleness (< 5 commits behind HEAD)
 88 | 5. If ANY check fails → commit BLOCKED with clear error
 89 | 6. Fix STATE.md, stage it, retry commit
 90 | 
 91 | ## Example Errors
 92 | 
 93 | **Version mismatch (STATE.md):**
 94 | ```
 95 | ❌ version_match failed (metadata: 2.4.0-rc.7, package.json: 999.0.0)
 96 | 
 97 | Fix with:
 98 |   1. Update .genie/STATE.md (version, commits)
 99 |   2. Mark tasks complete in Todo
100 |   3. Run: git add .genie/STATE.md
101 |   4. Retry commit
102 | ```
103 | 
104 | **First time setup (colleague clones repo):**
105 | ```
106 | ℹ️  TODO.md not found (optional per-user file)
107 |    Initialize: cp .genie/TODO.template.md .genie/TODO.md
108 | 
109 | ✅ Triad validation passed
110 | ```
111 | 
112 | ## Completion Checklist (AUTOMATED BY GIT)
113 | 
114 | - Git enforces STATE.md/TODO.md freshness automatically
115 | - Pre-commit hook cannot be bypassed (except `--no-verify` emergency)
116 | - No memory required - system enforces correctness
117 | 
118 | ## Why This Works
119 | 
120 | - ✅ Automatic: Git enforces, not Claude memory
121 | - ✅ Catches mistakes: Version mismatches, stale files detected
122 | - ✅ Self-correcting: Clear error messages guide fixes
123 | - ✅ Low overhead: Only runs on commit attempt
124 | - ✅ Definite: Can't commit without passing validation
125 | 
126 | ## Manual Validation (for testing)
127 | 
128 | ```bash
129 | bash .genie/scripts/check-triad.sh
130 | # Checks STATE.md and TODO.md without committing
131 | ```
132 | 
133 | ## Bypass (emergency only)
134 | 
135 | ```bash
136 | git commit --no-verify
137 | # Skips all git hooks - USE SPARINGLY
138 | ```
139 | 
140 | ## Context
141 | 
142 | - 2025-10-17: Discovered triad files loaded but never maintained
143 | - Felipe demanded "definite solution" - result is automatic enforcement
144 | - Architecture evolved: shared STATE.md (committed) vs per-user TODO.md/USERCONTEXT.md (gitignored)
145 | - Hook validates ALL files (even gitignored) but only commits shared state
146 | - Natural context acquisition: hook teaches setup, validates optionally
147 | 
148 | ## Your Colleague's Experience
149 | 
150 | 1. Clones repo → gets STATE.md automatically
151 | 2. First commit → hook shows "Initialize: cp .genie/TODO.template.md .genie/TODO.md"
152 | 3. Creates TODO.md → hook validates it going forward
153 | 4. Each developer has their own work queue
154 | 5. Everyone shares same STATE.md
155 | 


--------------------------------------------------------------------------------
/.genie/product/templates/context-template.md:
--------------------------------------------------------------------------------
  1 | # 🧞 Genie Context: {{USER_NAME}}
  2 | 
  3 | **Current Repo:** !`basename $(pwd)`
  4 | **Active Since:** !`date -u +"%Y-%m-%d"`
  5 | 
  6 | ---
  7 | 
  8 | ## 📊 Runtime Context (Auto-Updated)
  9 | 
 10 | **Branch:** !`git branch --show-current`
 11 | 
 12 | **Status:**
 13 | !`git status --short | head -10`
 14 | 
 15 | **Staged Changes:**
 16 | !`git diff --cached --stat | head -5`
 17 | 
 18 | **Unstaged Changes:**
 19 | !`git diff --stat | head -5`
 20 | 
 21 | **Recent Commits:**
 22 | !`git log --oneline -5`
 23 | 
 24 | ---
 25 | 
 26 | ## 🎯 Current Focus
 27 | 
 28 | **Task:** [What you're working on]
 29 | **Status:** [ACTIVE | PAUSED | PLANNING]
 30 | **Started:** [YYYY-MM-DD HH:MM UTC]
 31 | 
 32 | **Context:**
 33 | - [Key context points]
 34 | - [What's been completed]
 35 | - [What's in progress]
 36 | 
 37 | **Next Action:**
 38 | [What to do next]
 39 | 
 40 | ---
 41 | 
 42 | ## 🔄 Active Parallel Work
 43 | 
 44 | ### Background Orchestrators
 45 | *Track MCP agent sessions here*
 46 | 
 47 | ### Delegated Work
 48 | *Track task delegations here*
 49 | 
 50 | **Note:** When spawning parallel work, add entries here with session IDs and status checks.
 51 | 
 52 | ---
 53 | 
 54 | ## ⏳ Decision Queue (One at a Time)
 55 | 
 56 | ### Decision 1: [Topic] [ACTIVE NOW]
 57 | 
 58 | **Question:** [The decision you need to make]
 59 | 
 60 | **Context:**
 61 | - [Background information]
 62 | - [What it affects]
 63 | - [What it blocks]
 64 | 
 65 | **Question presented:** [YYYY-MM-DD ~HH:MM UTC]
 66 | 
 67 | ---
 68 | 
 69 | ## 👤 User Profile: {{USER_NAME}}
 70 | 
 71 | ### Communication Preferences
 72 | 
 73 | **Decision Presentation:**
 74 | - ✅ ONE decision per message (never ABCD parallel options)
 75 | - ✅ Full context: question, background, what it blocks
 76 | - ✅ Present options AFTER question, not bundled
 77 | - ✅ Wait for response before next decision
 78 | - ✅ Use decision queue (this file) for sequential presentation
 79 | 
 80 | **Working Style:**
 81 | - [Your preferences]
 82 | - [How you like to work]
 83 | - [Communication style]
 84 | 
 85 | **Session Interaction:**
 86 | - ✅ Greet with current context (reference this file)
 87 | - ✅ Build on previous learnings
 88 | - ✅ Sequential focus (one thing deeply, not many shallowly)
 89 | - ✅ Use this file to track parallel work and decisions
 90 | 
 91 | **Feedback Style:**
 92 | - [How you prefer feedback]
 93 | - [What works well]
 94 | - [What to avoid]
 95 | 
 96 | ---
 97 | 
 98 | ## 📚 Relationship History
 99 | 
100 | **First session:** [YYYY-MM-DD]
101 | **Total sessions:** [Count]
102 | **Collaboration style:** [Description]
103 | 
104 | **Key moments:**
105 | - [Date]: [Important milestone or learning]
106 | - [Date]: [Another key moment]
107 | 
108 | **Current projects:**
109 | 1. [Project name] ([status/phase])
110 | 2. [Another project]
111 | 
112 | **Working relationship:**
113 | - [How you work with Claude Code]
114 | - [Patterns that work well]
115 | - [Things to remember]
116 | 
117 | ---
118 | 
119 | ## 📋 Recent Completions (Current Session)
120 | 
121 | **Major accomplishments:**
122 | - ✅ [Completed item]
123 | - ✅ [Another completion]
124 | 
125 | **Learnings captured:**
126 | - [New pattern learned]
127 | - [Technique discovered]
128 | 
129 | ---
130 | 
131 | ## 🗂️ Open Issues Registry ({{PROJECT_NAME}})
132 | 
133 | | # | Title | Status | % | Action |
134 | |---|-------|--------|---|--------|
135 | | X | [Issue title] | [PASS/FAIL/PARTIAL] | X% | [Next step] |
136 | 
137 | **Summary:** [Compliance stats or overview]
138 | 
139 | ---
140 | 
141 | ## 💡 Patterns Learned (Cross-Repo)
142 | 
143 | ### [Pattern Name] ([YYYY-MM-DD])
144 | - **Pattern:** [Description]
145 | - **Why:** [Reasoning]
146 | - **Examples:** [Usage examples]
147 | - **Use cases:** [When to apply]
148 | - **Report:** [Link to learning report if exists]
149 | 
150 | ---
151 | 
152 | ## 🛠️ How to Use This File
153 | 
154 | **Session Start (Auto):**
155 | 1. Claude Code loads CLAUDE.md
156 | 2. Finds `@~/.genie/context.md` reference
157 | 3. Executes all `!command` statements
158 | 4. Greets you with:
159 |    - Current focus
160 |    - Where you left off
161 |    - Fresh git context
162 |    - Next queued decision
163 | 
164 | **During Session:**
165 | - Check "Current Focus" to know what you're working on
166 | - Update "Recent Completions" as you finish tasks
167 | - Add decisions to queue (don't present all at once!)
168 | - Track parallel work in "Active Parallel Work" section
169 | 
170 | **Session End:**
171 | - Update "Current Focus" with progress
172 | - Add completions to "Recent Completions"
173 | - Queue any pending decisions
174 | - Learnings auto-captured via /learn command
175 | 
176 | **Decision Management:**
177 | - Add decisions to queue as they arise
178 | - Present ONE at a time from queue
179 | - Remove from queue when resolved
180 | - Never present multiple decisions in parallel (ABCD format)
181 | 
182 | ---
183 | 
184 | ## 🎯 Session Greeting Template
185 | 
186 | When you start a new session, Claude Code greets like this:
187 | 
188 | > "Hey {{USER_NAME}}! 👋
189 | >
190 | > **Current focus:** [from Current Focus section]
191 | > **Where we left off:** [last item from Recent Completions]
192 | > **Branch:** [from !git branch]
193 | > **Status:** [summary from !git status]
194 | >
195 | > [If decision queued]: **Next up:** Decision 1 about [topic]. Ready to discuss?
196 | > [If no decision]: Ready to continue or switch focus?"
197 | 
198 | This ensures:
199 | - ✅ Immediate context restoration
200 | - ✅ Fresh runtime state
201 | - ✅ Clear continuation point
202 | - ✅ No replanning needed
203 | - ✅ Relationship continuity
204 | 
205 | ---
206 | 
207 | **System Status:** ✅ ACTIVE
208 | 
209 | **This file location:** `~/.genie/context.md` (user-local, cross-repo)
210 | 
211 | **Loaded via:** `@~/.genie/context.md` in CLAUDE.md (line 3)
212 | 
213 | **Next evolution:** [Your ideas for improving this system]
214 | 
215 | ---
216 | 
217 | 🧞 **Session continuity system active!** No more amnesia. Let's build. ✨
218 | 


--------------------------------------------------------------------------------
/.genie/scripts/helpers/validate-links.js:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env node
  2 | 
  3 | /**
  4 |  * Validate Markdown Links Helper
  5 |  *
  6 |  * Check markdown links for broken references (files and anchors).
  7 |  * Detects [text](path) links pointing to non-existent files or anchors.
  8 |  *
  9 |  * Usage:
 10 |  *   node validate-links.js <file-path>     # Check links in file
 11 |  *   node validate-links.js <directory>     # Check all .md files in directory
 12 |  *
 13 |  * Output:
 14 |  *   <file>:<line>: Broken link [text](path) - File not found
 15 |  *   <file>:<line>: Broken link [text](path#anchor) - Anchor not found
 16 |  */
 17 | 
 18 | const fs = require('fs');
 19 | const path = require('path');
 20 | 
 21 | /**
 22 |  * Extract markdown links from text
 23 |  * Returns: [{ text, href, line }]
 24 |  */
 25 | function extractLinks(content) {
 26 |   const lines = content.split('\n');
 27 |   const links = [];
 28 |   const linkRegex = /\[([^\]]+)\]\(([^)]+)\)/g;
 29 | 
 30 |   lines.forEach((line, idx) => {
 31 |     let match;
 32 |     while ((match = linkRegex.exec(line)) !== null) {
 33 |       const text = match[1];
 34 |       const href = match[2];
 35 | 
 36 |       // Skip external URLs
 37 |       if (href.startsWith('http://') || href.startsWith('https://')) {
 38 |         continue;
 39 |       }
 40 | 
 41 |       links.push({ text, href, line: idx + 1 });
 42 |     }
 43 |   });
 44 | 
 45 |   return links;
 46 | }
 47 | 
 48 | /**
 49 |  * Check if file exists
 50 |  */
 51 | function fileExists(filePath, basePath) {
 52 |   const fullPath = path.resolve(path.dirname(basePath), filePath);
 53 |   return fs.existsSync(fullPath);
 54 | }
 55 | 
 56 | /**
 57 |  * Check if anchor exists in file
 58 |  */
 59 | function anchorExists(filePath, anchor, basePath) {
 60 |   try {
 61 |     const fullPath = path.resolve(path.dirname(basePath), filePath);
 62 |     const content = fs.readFileSync(fullPath, 'utf-8');
 63 | 
 64 |     // Convert anchor to heading format
 65 |     // #my-heading → ## My Heading or ### My Heading, etc.
 66 |     const headingText = anchor.toLowerCase().replace(/-/g, ' ');
 67 |     const headingRegex = new RegExp(`^#+\\s+${headingText.replace(/[.*+?^${}()|[\]\\]/g, '\\$&')}`, 'im');
 68 | 
 69 |     return headingRegex.test(content);
 70 |   } catch (err) {
 71 |     return false;
 72 |   }
 73 | }
 74 | 
 75 | /**
 76 |  * Validate links in file
 77 |  */
 78 | function validateFile(filePath) {
 79 |   try {
 80 |     const content = fs.readFileSync(filePath, 'utf-8');
 81 |     const links = extractLinks(content);
 82 |     const issues = [];
 83 | 
 84 |     links.forEach(({ text, href, line }) => {
 85 |       // Split href into path and anchor
 86 |       const [linkPath, anchor] = href.split('#');
 87 | 
 88 |       // Check if it's just an anchor (same file)
 89 |       if (!linkPath && anchor) {
 90 |         if (!anchorExists(filePath, anchor, filePath)) {
 91 |           issues.push({
 92 |             file: filePath,
 93 |             line,
 94 |             text,
 95 |             href,
 96 |             error: `Anchor not found: #${anchor}`,
 97 |           });
 98 |         }
 99 |         return;
100 |       }
101 | 
102 |       // Check if file exists
103 |       if (!fileExists(linkPath, filePath)) {
104 |         issues.push({
105 |           file: filePath,
106 |           line,
107 |           text,
108 |           href,
109 |           error: 'File not found',
110 |         });
111 |         return;
112 |       }
113 | 
114 |       // If anchor specified, check if it exists in target file
115 |       if (anchor && !anchorExists(linkPath, anchor, filePath)) {
116 |         issues.push({
117 |           file: filePath,
118 |           line,
119 |           text,
120 |           href,
121 |           error: `Anchor not found: #${anchor}`,
122 |         });
123 |       }
124 |     });
125 | 
126 |     return issues;
127 |   } catch (err) {
128 |     return [{ file: filePath, error: `Failed to read file: ${err.message}` }];
129 |   }
130 | }
131 | 
132 | /**
133 |  * Validate all .md files in directory
134 |  */
135 | function validateDirectory(dirPath) {
136 |   const allIssues = [];
137 | 
138 |   function scanDir(dir) {
139 |     const entries = fs.readdirSync(dir, { withFileTypes: true });
140 | 
141 |     entries.forEach(entry => {
142 |       const fullPath = path.join(dir, entry.name);
143 | 
144 |       if (entry.isDirectory() && !entry.name.startsWith('.')) {
145 |         scanDir(fullPath);
146 |       } else if (entry.isFile() && entry.name.endsWith('.md')) {
147 |         const issues = validateFile(fullPath);
148 |         allIssues.push(...issues);
149 |       }
150 |     });
151 |   }
152 | 
153 |   scanDir(dirPath);
154 |   return allIssues;
155 | }
156 | 
157 | /**
158 |  * Main
159 |  */
160 | function main() {
161 |   const args = process.argv.slice(2);
162 | 
163 |   if (args.length === 0) {
164 |     console.error(`
165 | Usage:
166 |   node validate-links.js <file-path>     # Check links in single file
167 |   node validate-links.js <directory>     # Check all .md files recursively
168 | 
169 | Output:
170 |   <file>:<line>: Broken link [text](path) - error description
171 | 
172 | Exit code:
173 |   0 = All links valid
174 |   1 = Broken links found
175 | `);
176 |     process.exit(1);
177 |   }
178 | 
179 |   const target = args[0];
180 | 
181 |   if (!fs.existsSync(target)) {
182 |     console.error(`Error: Path not found: ${target}`);
183 |     process.exit(1);
184 |   }
185 | 
186 |   const stat = fs.statSync(target);
187 |   const issues = stat.isDirectory()
188 |     ? validateDirectory(target)
189 |     : validateFile(target);
190 | 
191 |   if (issues.length === 0) {
192 |     console.log('All links valid');
193 |     process.exit(0);
194 |   }
195 | 
196 |   issues.forEach(issue => {
197 |     if (issue.line) {
198 |       console.log(`${issue.file}:${issue.line}: Broken link [${issue.text}](${issue.href}) - ${issue.error}`);
199 |     } else {
200 |       console.log(`${issue.file}: ${issue.error}`);
201 |     }
202 |   });
203 | 
204 |   process.exit(1);
205 | }
206 | 
207 | main();
208 | 


--------------------------------------------------------------------------------
/.genie/scripts/helpers/bullet-counter.js:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env node
  2 | 
  3 | /**
  4 |  * Bullet Counter Updater
  5 |  *
  6 |  * Find and update helpful/harmful counters for learning bullets.
  7 |  *
  8 |  * Usage:
  9 |  *   genie helper bullet-counter ID --helpful
 10 |  *   genie helper bullet-counter ID --harmful
 11 |  *   genie helper bullet-counter ID (show current counters)
 12 |  */
 13 | 
 14 | const fs = require('fs');
 15 | const path = require('path');
 16 | const { exec } = require('child_process');
 17 | const { promisify } = require('util');
 18 | 
 19 | const execAsync = promisify(exec);
 20 | 
 21 | /**
 22 |  * Find bullet by ID across all markdown files
 23 |  * Returns: { file, line, content, helpful, harmful }
 24 |  */
 25 | function findBullet(id) {
 26 |   const searchPath = path.join(process.cwd(), '.genie');
 27 | 
 28 |   // Use ripgrep to find the bullet
 29 |   const pattern = `^- \\[${id}\\] helpful=(\\d+) harmful=(\\d+):`;
 30 | 
 31 |   try {
 32 |     const { execSync } = require('child_process');
 33 |     const result = execSync(
 34 |       `rg -n "${pattern}" "${searchPath}"`,
 35 |       { encoding: 'utf-8' }
 36 |     ).trim();
 37 | 
 38 |     if (!result) {
 39 |       return null;
 40 |     }
 41 | 
 42 |     // Parse result: file:line:content
 43 |     const match = result.match(/^([^:]+):(\d+):(.+)$/);
 44 |     if (!match) {
 45 |       return null;
 46 |     }
 47 | 
 48 |     const [, file, lineNum, content] = match;
 49 | 
 50 |     // Extract counters from content
 51 |     const counterMatch = content.match(/helpful=(\d+) harmful=(\d+)/);
 52 |     if (!counterMatch) {
 53 |       return null;
 54 |     }
 55 | 
 56 |     return {
 57 |       file: file,
 58 |       line: parseInt(lineNum, 10),
 59 |       content: content,
 60 |       helpful: parseInt(counterMatch[1], 10),
 61 |       harmful: parseInt(counterMatch[2], 10)
 62 |     };
 63 |   } catch (err) {
 64 |     // rg returns exit code 1 when no matches found
 65 |     if (err.status === 1) {
 66 |       return null;
 67 |     }
 68 |     throw err;
 69 |   }
 70 | }
 71 | 
 72 | /**
 73 |  * Update bullet counter in file
 74 |  */
 75 | function updateBulletCounter(bullet, incrementHelpful, incrementHarmful) {
 76 |   const newHelpful = bullet.helpful + (incrementHelpful ? 1 : 0);
 77 |   const newHarmful = bullet.harmful + (incrementHarmful ? 1 : 0);
 78 | 
 79 |   // Read file
 80 |   const content = fs.readFileSync(bullet.file, 'utf-8');
 81 |   const lines = content.split('\n');
 82 | 
 83 |   // Update the line (1-indexed to 0-indexed)
 84 |   const lineIndex = bullet.line - 1;
 85 |   const oldLine = lines[lineIndex];
 86 | 
 87 |   // Replace counters in the line
 88 |   const newLine = oldLine.replace(
 89 |     /helpful=(\d+) harmful=(\d+)/,
 90 |     `helpful=${newHelpful} harmful=${newHarmful}`
 91 |   );
 92 | 
 93 |   if (oldLine === newLine) {
 94 |     console.error('Warning: No change detected');
 95 |     return bullet;
 96 |   }
 97 | 
 98 |   // Write updated content
 99 |   lines[lineIndex] = newLine;
100 |   fs.writeFileSync(bullet.file, lines.join('\n'));
101 | 
102 |   return {
103 |     ...bullet,
104 |     content: newLine,
105 |     helpful: newHelpful,
106 |     harmful: newHarmful
107 |   };
108 | }
109 | 
110 | /**
111 |  * Display bullet info
112 |  */
113 | function displayBullet(bullet) {
114 |   console.log(JSON.stringify({
115 |     file: path.relative(process.cwd(), bullet.file),
116 |     line: bullet.line,
117 |     helpful: bullet.helpful,
118 |     harmful: bullet.harmful,
119 |     content: bullet.content.trim()
120 |   }, null, 2));
121 | }
122 | 
123 | /**
124 |  * Main CLI
125 |  */
126 | async function main() {
127 |   const args = process.argv.slice(2);
128 | 
129 |   // Help
130 |   if (args.length === 0 || args.includes('--help') || args.includes('-h')) {
131 |     console.log('Usage:');
132 |     console.log('  genie helper bullet-counter ID');
133 |     console.log('    Show current counters for bullet');
134 |     console.log('');
135 |     console.log('  genie helper bullet-counter ID --helpful');
136 |     console.log('    Increment helpful counter');
137 |     console.log('');
138 |     console.log('  genie helper bullet-counter ID --harmful');
139 |     console.log('    Increment harmful counter');
140 |     console.log('');
141 |     console.log('Examples:');
142 |     console.log('  $ genie helper bullet-counter learn-042');
143 |     console.log('  {');
144 |     console.log('    "file": ".genie/spells/learn.md",');
145 |     console.log('    "line": 356,');
146 |     console.log('    "helpful": 5,');
147 |     console.log('    "harmful": 0');
148 |     console.log('  }');
149 |     console.log('');
150 |     console.log('  $ genie helper bullet-counter learn-042 --helpful');
151 |     console.log('  Updated: helpful=6 harmful=0');
152 |     return;
153 |   }
154 | 
155 |   const id = args[0];
156 |   const incrementHelpful = args.includes('--helpful');
157 |   const incrementHarmful = args.includes('--harmful');
158 | 
159 |   if (!id) {
160 |     console.error('Error: Bullet ID required');
161 |     console.error('Usage: genie helper bullet-counter ID [--helpful|--harmful]');
162 |     process.exit(1);
163 |   }
164 | 
165 |   // Find bullet
166 |   const bullet = findBullet(id);
167 | 
168 |   if (!bullet) {
169 |     console.error(`Error: Bullet [${id}] not found`);
170 |     console.error('');
171 |     console.error('Searched in: .genie/');
172 |     console.error('Pattern: - [ID] helpful=N harmful=M: content');
173 |     console.error('');
174 |     console.error('Tip: Use "genie helper bullet-find" to search for bullets');
175 |     process.exit(1);
176 |   }
177 | 
178 |   // Show current state
179 |   if (!incrementHelpful && !incrementHarmful) {
180 |     displayBullet(bullet);
181 |     return;
182 |   }
183 | 
184 |   // Update counter
185 |   const updated = updateBulletCounter(bullet, incrementHelpful, incrementHarmful);
186 | 
187 |   console.log(`Updated: helpful=${updated.helpful} harmful=${updated.harmful}`);
188 |   console.log(`File: ${path.relative(process.cwd(), updated.file)}:${updated.line}`);
189 | }
190 | 
191 | main().catch(err => {
192 |   console.error('ERROR:', err.message);
193 |   process.exit(1);
194 | });
195 | 


--------------------------------------------------------------------------------