bd sync: 2026-01-09 17:32:23

2026-01-09 17:32:23 -08:00 · 2026-01-09 17:32:23 -08:00 · e367be6cb6
parent ec2d856c05
commit e367be6cb6
2 changed files with 3 additions and 3 deletions
--- a/.beads/issues.jsonl
+++ b/.beads/issues.jsonl
@@ -80,7 +80,7 @@
 {"id":"skills-ebl","title":"Benchmark vision model UI understanding","description":"## Goal\nMeasure how well vision models can answer UI questions from screenshots.\n\n## Test cases\n1. **Element location**: \"Where is the Save button?\" → coordinates\n2. **Element identification**: \"What buttons are visible?\" → list\n3. **State detection**: \"Is the checkbox checked?\" → boolean\n4. **Text extraction**: \"What does the error message say?\" → text\n5. **Layout understanding**: \"What's in the sidebar?\" → structure\n\n## Metrics\n- Accuracy: Does the answer match ground truth?\n- Precision: How close are coordinates to actual element centers?\n- Latency: Time from query to response\n- Cost: Tokens consumed per query\n\n## Prompt engineering questions\n- Does adding a grid overlay help coordinate precision?\n- What prompt format gives most actionable coordinates?\n- Can we get bounding boxes vs point coordinates?\n\n## Comparison baseline\n- Manual annotation of test screenshots\n- AT-SPI data (once enabled) as ground truth\n\n## Depends on\n- Test screenshots from real apps\n- Ground truth annotations","status":"closed","priority":2,"issue_type":"task","created_at":"2025-12-17T14:13:10.038933798-08:00","updated_at":"2025-12-29T15:26:19.822655148-05:00","closed_at":"2025-12-29T15:26:19.822655148-05:00","close_reason":"Benchmark complete. Vision models excellent for semantic understanding, approximate for coordinates. Recommend hybrid AT-SPI + vision. See docs/research/vision-ui-benchmark-2025-12-29.md"}
 {"id":"skills-f2p","title":"Skills + Molecules Integration","description":"Integrate skills with beads molecules system.\n\nDesign work tracked in dotfiles (dotfiles-jjb).\n\nComponents:\n- Checklist support (lightweight skills)\n- Audit integration (bd audit for skill execution)\n- Skill frontmatter for triggers/tracking\n- Proto packaging alongside skills\n\nSee: ~/proj/dotfiles ADR work","status":"closed","priority":2,"issue_type":"epic","created_at":"2025-12-23T17:58:55.999438985-05:00","updated_at":"2025-12-23T19:22:38.577280129-05:00","closed_at":"2025-12-23T19:22:38.577280129-05:00","close_reason":"Superseded by skills-4u0 (migrated from dotfiles)","dependencies":[{"issue_id":"skills-f2p","depends_on_id":"skills-vpy","type":"blocks","created_at":"2025-12-23T17:59:17.976956454-05:00","created_by":"daemon"},{"issue_id":"skills-f2p","depends_on_id":"skills-u3d","type":"blocks","created_at":"2025-12-23T17:59:18.015216054-05:00","created_by":"daemon"}]}
 {"id":"skills-fo3","title":"Compare WORKFLOWS.md with upstream","status":"closed","priority":2,"issue_type":"task","created_at":"2025-12-03T20:15:54.283175561-08:00","updated_at":"2025-12-03T20:19:28.897037199-08:00","closed_at":"2025-12-03T20:19:28.897037199-08:00","dependencies":[{"issue_id":"skills-fo3","depends_on_id":"skills-ebh","type":"discovered-from","created_at":"2025-12-03T20:15:54.286009672-08:00","created_by":"daemon","metadata":"{}"}]}
-{"id":"skills-fqu","title":"Research: Agent capability matrix","description":"Document what each agent can and cannot do for cross-agent design decisions.\n\nAgents to cover:\n- Claude Code (claude CLI)\n- Gemini (gemini CLI / AI Studio)\n- OpenCode\n- Codex (OpenAI)\n\nCapabilities to assess:\n- Hooks / lifecycle events\n- Subagent spawning\n- File system access (paths, restrictions)\n- CLI tool execution\n- State persistence\n- Context window / memory\n\nOutput: Matrix showing capability parity and gaps","status":"in_progress","priority":2,"issue_type":"task","created_at":"2026-01-09T17:14:20.541961958-08:00","created_by":"dan","updated_at":"2026-01-09T17:16:13.794753056-08:00"}
+{"id":"skills-fqu","title":"Research: Agent capability matrix","description":"Document what each agent can and cannot do for cross-agent design decisions.\n\nAgents to cover:\n- Claude Code (claude CLI)\n- Gemini (gemini CLI / AI Studio)\n- OpenCode\n- Codex (OpenAI)\n\nCapabilities to assess:\n- Hooks / lifecycle events\n- Subagent spawning\n- File system access (paths, restrictions)\n- CLI tool execution\n- State persistence\n- Context window / memory\n\nOutput: Matrix showing capability parity and gaps","status":"closed","priority":2,"issue_type":"task","created_at":"2026-01-09T17:14:20.541961958-08:00","created_by":"dan","updated_at":"2026-01-09T17:32:23.730556916-08:00","closed_at":"2026-01-09T17:32:23.730556916-08:00","close_reason":"Capability matrix complete: docs/research/agent-capability-matrix.md"}
 {"id":"skills-fvc","title":"Code Review: {{target}}","description":"Multi-lens code review workflow for {{target}}.\n\n## Philosophy\nThe LLM stays in the loop at every step - this is agent-assisted review, not automated parsing. The agent applies judgment about what's worth filing, how to prioritize, and what context to include.\n\n## Variables\n- target: File or directory to review\n\n## Workflow\n1. Explore codebase to find candidates (if target is directory)\n2. Run lenses via orch consensus for multi-model perspective\n3. Analyze findings - LLM synthesizes across lenses and models\n4. File issues with judgment - group related, set priorities, add context\n5. Summarize for digest\n\n## Lenses Available\n- bloat: size, complexity, SRP violations\n- smells: readability, naming, control flow\n- dead-code: unused, unreachable, obsolete\n- redundancy: duplication, YAGNI, parallel systems","status":"closed","priority":2,"issue_type":"epic","created_at":"2025-12-25T10:10:57.652098447-05:00","updated_at":"2025-12-26T23:22:41.408582818-05:00","closed_at":"2025-12-26T23:22:41.408582818-05:00","close_reason":"Replaced by /code-review skill","labels":["template"]}
 {"id":"skills-fvc.1","title":"Run bloat lens on {{target}}","description":"Run bloat review lens via orch:\n\n```bash\norch consensus \"$(cat ~/.config/lenses/bloat.md)\" flash gemini --file {{target}} --mode open\n```\n\nLook for: file size, function length, complexity, SRP violations.\nRecord findings for later filing.","status":"closed","priority":2,"issue_type":"task","created_at":"2025-12-25T10:13:59.789715667-05:00","updated_at":"2025-12-26T23:22:41.416754154-05:00","closed_at":"2025-12-26T23:22:41.416754154-05:00","close_reason":"Replaced by /code-review skill","dependencies":[{"issue_id":"skills-fvc.1","depends_on_id":"skills-fvc","type":"parent-child","created_at":"2025-12-25T10:13:59.80248308-05:00","created_by":"daemon"}]}
 {"id":"skills-fvc.2","title":"Run smells lens on {{target}}","description":"Run smells review lens via orch:\n\n```bash\norch consensus \"$(cat ~/.config/lenses/smells.md)\" flash gemini --file {{target}} --mode open\n```\n\nLook for: naming issues, control flow smells, data smells, structural issues.\nRecord findings for later filing.","status":"closed","priority":2,"issue_type":"task","created_at":"2025-12-25T10:16:13.977562568-05:00","updated_at":"2025-12-26T23:22:41.423564011-05:00","closed_at":"2025-12-26T23:22:41.423564011-05:00","close_reason":"Replaced by /code-review skill","dependencies":[{"issue_id":"skills-fvc.2","depends_on_id":"skills-fvc","type":"parent-child","created_at":"2025-12-25T10:16:13.989662453-05:00","created_by":"daemon"}]}
@@ -95,7 +95,7 @@
 {"id":"skills-gq9","title":"Define structured skill reference schema","description":"Replace simple skill: string with structured object.\n\nCurrent (too weak):\n  skill: worklog\n\nProposed:\n  skill:\n    id: worklog\n    ref: \"git+file://...#worklog@abc123\"\n    inputs:\n      session: \"{{session}}\"\n    expects:\n      files: [\"docs/worklogs/{{session}}.org\"]\n\nFrom orch consensus: both GPT and Gemini flagged this as critical gap.\nNo mechanism to pass args from molecule to skill.","status":"closed","priority":2,"issue_type":"task","created_at":"2025-12-23T19:49:30.529899123-05:00","updated_at":"2025-12-28T22:46:28.371352259-05:00","closed_at":"2025-12-28T22:46:28.371352259-05:00","close_reason":"Deferred: structured schema was for molecule→skill integration. Current approach (agent reads SKILL.md directly) works well. Skills as entrypoints are simpler than protos. Revisit if programmatic workflows become active.","dependencies":[{"issue_id":"skills-gq9","depends_on_id":"skills-oes","type":"blocks","created_at":"2025-12-23T19:50:10.337111856-05:00","created_by":"daemon"},{"issue_id":"skills-gq9","depends_on_id":"skills-8y6","type":"blocks","created_at":"2025-12-23T19:50:10.388301727-05:00","created_by":"daemon"}]}
 {"id":"skills-gvj","title":"Orch-in-the-Middle: LSP proxy for multi-model refactors","description":"Write an LSP proxy (Go/Rust) that:\n- Intercepts rename/code-action requests from editor\n- Sends to Orch for multi-model proposals\n- Validates proposals against real headless LSP\n- Returns winning WorkspaceEdit to editor\n\nGet consensus refactoring inside VS Code/Neovim by configuring LSP server path in home-manager.","status":"closed","priority":4,"issue_type":"feature","created_at":"2025-12-24T02:29:56.623189042-05:00","updated_at":"2025-12-29T14:37:35.360129462-05:00","closed_at":"2025-12-29T14:37:35.360129462-05:00","close_reason":"Parked: waiting on gastown (Steve Yegge's orchestration layer for beads). Revisit when gastown lands."}
 {"id":"skills-h9f","title":"spec-review: Balance negativity bias in prompts","description":"'Be critical' and 'devil's advocate' can bias toward over-flagging without acknowledging what's good.\n\nAdd:\n- 'List top 3 strongest parts of the document'\n- 'Call out where document is sufficiently clear/testable'\n- Categorize :against concerns as confirmed/plausible/rejected","status":"closed","priority":3,"issue_type":"task","created_at":"2025-12-15T00:23:26.418087998-08:00","updated_at":"2025-12-15T14:07:39.520818417-08:00","closed_at":"2025-12-15T14:07:39.520818417-08:00"}
-{"id":"skills-hf1","title":"Cross-agent skill portability and quality gates","description":"Design and implement patterns for skills that work across multiple AI agents (Claude, Gemini, OpenCode).\n\n## Problem Statement\n\nWe want skills and quality enforcement to work regardless of which agent is:\n- The primary orchestrator\n- The worker agent\n- The reviewer agent\n\nCurrent blockers:\n- Claude Code hooks (Stop, etc.) don't exist in other agents\n- Path restrictions differ (Gemini can't read ~/.claude/skills/)\n- Subagent spawning differs across agents\n- alice/idle quality gate is Claude-specific\n\n## Goals\n\n1. **Portable skills** - Same skill works in Claude, Gemini, OpenCode\n2. **Portable quality gates** - Adversarial review pattern across agents\n3. **Flexible orchestration** - Any agent can orchestrate, any can be worker/reviewer\n\n## Key Research Areas\n\n- Dual-publish pattern (done: ADR-005)\n- Cross-agent quality gate mechanisms\n- State management (jwz vs beads vs other)\n- Protocol vs mechanical enforcement trade-offs\n- Orchestrator pattern design\n\n## Related Work\n\n- emes ecosystem (alice, jwz, tissue)\n- Our dual-publish implementation\n- orch multi-model consensus","status":"open","priority":2,"issue_type":"epic","created_at":"2026-01-09T17:13:48.116438862-08:00","created_by":"dan","updated_at":"2026-01-09T17:13:54.006968189-08:00","dependencies":[{"issue_id":"skills-hf1","depends_on_id":"skills-3gk","type":"blocks","created_at":"2026-01-09T17:14:26.901205948-08:00","created_by":"dan"},{"issue_id":"skills-hf1","depends_on_id":"skills-fqu","type":"blocks","created_at":"2026-01-09T17:14:26.940496671-08:00","created_by":"dan"},{"issue_id":"skills-hf1","depends_on_id":"skills-3ja","type":"blocks","created_at":"2026-01-09T17:14:26.97832902-08:00","created_by":"dan"},{"issue_id":"skills-hf1","depends_on_id":"skills-mjf","type":"blocks","created_at":"2026-01-09T17:14:27.011077849-08:00","created_by":"dan"},{"issue_id":"skills-hf1","depends_on_id":"skills-6fu","type":"blocks","created_at":"2026-01-09T17:14:27.045750539-08:00","created_by":"dan"},{"issue_id":"skills-hf1","depends_on_id":"skills-bo8","type":"blocks","created_at":"2026-01-09T17:14:27.150392041-08:00","created_by":"dan"},{"issue_id":"skills-hf1","depends_on_id":"skills-5kv","type":"blocks","created_at":"2026-01-09T17:14:27.192813254-08:00","created_by":"dan"}]}
+{"id":"skills-hf1","title":"Cross-agent skill portability and quality gates","description":"Design and implement patterns for skills that work across multiple AI agents (Claude, Gemini, OpenCode).\n\n## Problem Statement\n\nWe want skills and quality enforcement to work regardless of which agent is:\n- The primary orchestrator\n- The worker agent\n- The reviewer agent\n\nCurrent blockers:\n- Claude Code hooks (Stop, etc.) don't exist in other agents\n- Path restrictions differ (Gemini can't read ~/.claude/skills/)\n- Subagent spawning differs across agents\n- alice/idle quality gate is Claude-specific\n\n## Goals\n\n1. **Portable skills** - Same skill works in Claude, Gemini, OpenCode\n2. **Portable quality gates** - Adversarial review pattern across agents\n3. **Flexible orchestration** - Any agent can orchestrate, any can be worker/reviewer\n\n## Key Research Areas\n\n- Dual-publish pattern (done: ADR-005)\n- Cross-agent quality gate mechanisms\n- State management (jwz vs beads vs other)\n- Protocol vs mechanical enforcement trade-offs\n- Orchestrator pattern design\n\n## Related Work\n\n- emes ecosystem (alice, jwz, tissue)\n- Our dual-publish implementation\n- orch multi-model consensus","status":"open","priority":2,"issue_type":"epic","created_at":"2026-01-09T17:13:48.116438862-08:00","created_by":"dan","updated_at":"2026-01-09T17:13:54.006968189-08:00","dependencies":[{"issue_id":"skills-hf1","depends_on_id":"skills-3gk","type":"blocks","created_at":"2026-01-09T17:14:26.901205948-08:00","created_by":"dan"},{"issue_id":"skills-hf1","depends_on_id":"skills-fqu","type":"blocks","created_at":"2026-01-09T17:14:26.940496671-08:00","created_by":"dan"},{"issue_id":"skills-hf1","depends_on_id":"skills-3ja","type":"blocks","created_at":"2026-01-09T17:14:26.97832902-08:00","created_by":"dan"},{"issue_id":"skills-hf1","depends_on_id":"skills-mjf","type":"blocks","created_at":"2026-01-09T17:14:27.011077849-08:00","created_by":"dan"},{"issue_id":"skills-hf1","depends_on_id":"skills-6fu","type":"blocks","created_at":"2026-01-09T17:14:27.045750539-08:00","created_by":"dan"},{"issue_id":"skills-hf1","depends_on_id":"skills-bo8","type":"blocks","created_at":"2026-01-09T17:14:27.150392041-08:00","created_by":"dan"},{"issue_id":"skills-hf1","depends_on_id":"skills-5kv","type":"blocks","created_at":"2026-01-09T17:14:27.192813254-08:00","created_by":"dan"},{"issue_id":"skills-hf1","depends_on_id":"skills-ut4","type":"blocks","created_at":"2026-01-09T17:32:23.828114543-08:00","created_by":"dan"}]}
 {"id":"skills-hgm","title":"Add tests for agent file update logic","description":"File: .specify/scripts/bash/update-agent-context.sh (lines 360-499)\n\nCritical logic with NO test coverage:\n- Malformed agent files (missing sections)\n- Multiple section headers on same line\n- Empty file handling\n- Timestamp update verification\n- State machine correctness\n\nRisk: HIGH - corrupts agent context files on failure\n\nFix:\n- Create test fixtures for various file states\n- Test each state transition\n- Verify idempotency\n\nSeverity: HIGH","status":"closed","priority":2,"issue_type":"task","created_at":"2025-12-24T02:51:00.793493549-05:00","updated_at":"2026-01-02T02:12:09.368531967-05:00","closed_at":"2026-01-02T02:12:09.368531967-05:00","close_reason":"33 tests added covering all major code paths. Also fixed bug where Recent Changes section was skipped when preceded by Active Technologies."}
 {"id":"skills-hh2","title":"skill: rename_symbol with LSP + validation","description":"Skill that performs safe renames:\n1. Uses LSP textDocument/rename\n2. Runs formatters\n3. Checks LSP diagnostics post-rename\n4. Opens bead if errors remain\n5. Updates doc references using hover/signatureHelp\n\nInput: new name, scope. Output: clean rename or bead with issues.","status":"open","priority":3,"issue_type":"task","created_at":"2025-12-24T02:29:56.87156069-05:00","updated_at":"2025-12-24T02:29:56.87156069-05:00","dependencies":[{"issue_id":"skills-hh2","depends_on_id":"skills-gga","type":"blocks","created_at":"2025-12-24T02:30:06.583813579-05:00","created_by":"daemon"}]}
 {"id":"skills-hhz","title":"Add doc-review skill","description":"Create skill for doc-review CLI tool (~/proj/doc-review). Tool lints markdown docs for AI agent consumption using Vale + LLM hybrid architecture. Needs: 1) flake.nix in doc-review project, 2) skill SKILL.md, 3) register in availableSkills","status":"closed","priority":2,"issue_type":"task","created_at":"2025-12-30T11:24:41.321478346-05:00","created_by":"dan","updated_at":"2025-12-31T00:00:30.74314365-05:00","closed_at":"2025-12-31T00:00:30.74314365-05:00","close_reason":"doc-review skill created in skills/doc-review/SKILL.md"}
--- a/.beads/last-touched
+++ b/.beads/last-touched
@@ -1 +1 @@
-skills-hf1
+skills-ut4