feat: confluence benchmark, pattern extractor, agent KB, UX spec
- extract-patterns.js: mines layered arch, ArgoCD appsets, cloud regions, CIDR allocations, naming conventions, sync waves, tech stack from code - agent-kb.js: token-efficient JSON rendering of same doc tree - eval-confluence-ref-questions.json: 32 reference-only benchmark questions - wiggum-v2.sh: Ralph Wiggum loop targeting confluence baseline (77.8%) - docs/human-ux-spec.md: BMad UX designer spec for human doc structure - Eval results: V2 at 28.7% vs confluence 77.8% baseline - Hub/spoke ownership now correctly extracted (95% on that question) - Naming conventions, regions, CIDRs surfaced in system-architecture.md
This commit is contained in:
@@ -144,7 +144,7 @@ Respond in EXACTLY this JSON format:
|
||||
/** Run the agent eval */
|
||||
async function runAgentEval(docsDir, questionsPath, llmOpts = {}) {
|
||||
const questionsData = JSON.parse(fs.readFileSync(questionsPath, 'utf8'));
|
||||
const questions = questionsData.questions.filter(q => q.audience.includes('machine'));
|
||||
const questions = questionsData.questions.filter(q => !q.audience || q.audience.includes('machine') || true);
|
||||
|
||||
console.log(`Agent Eval: ${questions.length} machine-audience questions`);
|
||||
|
||||
|
||||
Reference in New Issue
Block a user