
Commit 9bfa4e8

Finalize brainstorm mode and release docs
1 parent 88d84a8 commit 9bfa4e8

45 files changed: 2819 additions & 529 deletions


.prrrc.example.js

Lines changed: 53 additions & 1 deletion
````diff
@@ -14,6 +14,7 @@ module.exports = {
       endpoint: 'https://integrate.api.nvidia.com/v1',
       apiKeyEnv: 'NVIDIA_API_KEY',
       model: 'meta/llama-3.3-70b-instruct',
+      mode: 'defects',
       prompt: 'Find concrete security vulnerabilities, trust-boundary mistakes, and edge-case failures. Cite files and line numbers.',
       useTools: true,
       maxToolRounds: 8
@@ -24,11 +25,62 @@ module.exports = {
       endpoint: 'https://api.openai.com/v1',
       apiKeyEnv: 'OPENAI_API_KEY',
       timeoutMs: 120000,
+      mode: 'defects',
       structuredOutputMode: 'json_schema',
+      // For GPT-5 models, omit maxOutputTokens unless you need a cap.
+      // OpenAI counts reasoning tokens inside max_completion_tokens.
       model: 'gpt-5-mini',
       prompt: 'Triage the changed code for correctness, regressions, and weak assumptions. Prefer concrete bugs over style.',
       useTools: true,
       maxToolRounds: 6
+    },
+    {
+      name: 'Optional Brainstorm',
+      provider: 'openai',
+      endpoint: 'https://api.openai.com/v1',
+      apiKeyEnv: 'OPENAI_API_KEY',
+      timeoutMs: 120000,
+      mode: 'suggestions',
+      structuredOutputMode: 'json_schema',
+      allowSuggestions: true,
+      maxSuggestions: 2,
+      // If you do set maxOutputTokens on GPT-5, keep it well above the visible output target.
+      model: 'gpt-5-mini',
+      prompt: 'Suggest at most 2 grounded follow-up improvements. Do not repeat defects. Avoid rewrites and generic wishlist items. Every suggestion must have a clear benefit and tradeoff.',
+      useTools: true,
+      maxToolRounds: 4
+    }
+  ],
+  brainstormers: [
+    {
+      name: 'Scope Challenger',
+      provider: 'nvidia-free',
+      endpoint: 'https://integrate.api.nvidia.com/v1',
+      apiKeyEnv: 'NVIDIA_API_KEY',
+      model: 'meta/llama-3.1-70b-instruct',
+      structuredOutputMode: 'json_object',
+      prompt: 'Challenge the concept scope and identify missing constraints, hidden assumptions, and where the MVP should be narrower.',
+      useTools: false
+    },
+    {
+      name: 'Validation Planner',
+      provider: 'nvidia-free',
+      endpoint: 'https://integrate.api.nvidia.com/v1',
+      apiKeyEnv: 'NVIDIA_API_KEY',
+      model: 'meta/llama-3.1-405b-instruct',
+      structuredOutputMode: 'json_object',
+      prompt: 'Turn the concept into validation work: experiments, acceptance checks, and success criteria before implementation starts.',
+      useTools: false
     }
-  ]
+  ],
+  brainstormSynthesis: {
+    name: 'Core Coder',
+    provider: 'nvidia-free',
+    endpoint: 'https://integrate.api.nvidia.com/v1',
+    apiKeyEnv: 'NVIDIA_API_KEY',
+    model: 'meta/llama-3.1-405b-instruct',
+    structuredOutputMode: 'json_object',
+    prompt: 'Synthesize the brainstorm panel into a grounded recommendation, a short priority list, open questions, deferred ideas, and a revised next brief.',
+    useTools: false
+  }
 };
````
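The reviewer-lane semantics introduced in this config can be summarized with a small sketch. This is illustrative only, assuming the documented behavior that `mode` defaults to `defects` and that `mode: 'suggestions'` turns `allowSuggestions` on automatically; `resolveLane` is a hypothetical helper, not part of prr.

```javascript
// Illustrative only, not prr's actual code: how the documented
// reviewer-lane defaults could be resolved for one reviewer entry.
function resolveLane(reviewer) {
  const mode = reviewer.mode || 'defects'; // documented default lane
  return {
    mode,
    // mode: 'suggestions' implies allowSuggestions
    allowSuggestions: reviewer.allowSuggestions === true || mode === 'suggestions'
  };
}

const defectLane = resolveLane({ name: 'Security Reviewer' });
const ideaLane = resolveLane({ name: 'Optional Brainstorm', mode: 'suggestions' });
```

A reviewer without an explicit `mode` stays a pure defect lane, which matches the recommended split in this commit: defect reviewers by default, one capped suggestions lane on the side.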

AGENTS.md

Lines changed: 0 additions & 37 deletions
This file was deleted.

CHANGELOG.md

Lines changed: 24 additions & 0 deletions
````diff
@@ -0,0 +1,24 @@
+## 0.1.0
+
+Initial public release of `prr-cli`.
+
+### Highlights
+
+- Run parallel or sequential PR/code reviews from the CLI against OpenAI-compatible backends.
+- Support reviewer lanes for both `defects` and `suggestions` workflows.
+- Add `prr brainstorm <brief.md>` with a separate `brainstormers` panel for concept and plan review.
+- Support optional `brainstormSynthesis` output that turns panel findings into a prioritized recommendation and revised next brief.
+- Allow tool-enabled reviewers to fetch more file context on demand.
+- Ship structured output support with `json_schema` and `json_object` modes when the provider supports them.
+- Include auto-selection logic that prefers verified elite tool-capable models.
+- Document a strict elite model list backed by live large-prompt and tool-calling validation.
+- Include NVIDIA model probe tooling and experiment helpers for evaluating reviewer/model combinations.
+
+### Release preparation notes
+
+- Default reviewer and experiment tool-enabled models were aligned to verified tool-capable elite models.
+- Packaging was tightened with an explicit npm `files` allowlist.
+- Publishing metadata now includes repository, homepage, and issue tracker links.
+- Live validation passed for both NVIDIA and OpenAI-compatible flows.
+- Live brainstorm validation passed, including synthesis `nextBrief` preservation in the final structured report.
+- GPT-5 configuration guidance was added for `maxOutputTokens` / reasoning-token budgeting.
````

LICENSE

Lines changed: 1 addition & 1 deletion
````diff
@@ -1,6 +1,6 @@
 MIT License
 
-Copyright (c) 2026
+Copyright (c) 2026 Engin Ypsilon
 
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal
````

README.md

Lines changed: 109 additions & 32 deletions
````diff
@@ -1,6 +1,12 @@
 # prr-cli
 
-`prr` is a Node.js CLI for running parallel code reviews against multiple NVIDIA-hosted language models.
+`prr` is a Node.js CLI for running parallel code reviews and concept brainstorms against OpenAI-compatible language models, including NVIDIA-hosted and OpenAI backends.
+
+## Why multiple reviewers?
+
+Different models often produce code that looks similarly correct on the surface, but they reach that result through different internal strengths, assumptions, and blind spots.
+
+`prr` uses that diversity on purpose: by collecting multiple independent reviews, you increase the chance that one model notices an edge case, risk, or alternative approach that another model would miss.
 
 ## Requirements
 - Node.js 18+
````
````diff
@@ -17,6 +23,14 @@ For local development you can run the CLI without publishing:
 node bin/prr.js review src/**/*.js
 ```
 
+## Fastest way to try `prr`: NVIDIA quick start
+
+Most examples in this repo work well with a free NVIDIA Build account.
+
+1. Create a free account on NVIDIA: `https://build.nvidia.com/`
+2. After login, go to `https://build.nvidia.com/settings/api-keys` and `Generate API Key`
+3. Copy `.env.example` to `.env`, set `NVIDIA_API_KEY`, then run `node bin/prr.js doctor`
+
 ## API Keys
 `prr` reads API keys from the configured environment variable name, defaulting to `NVIDIA_API_KEY`.
````
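The key lookup described in the API Keys section can be sketched in a few lines. This is a hypothetical helper, not prr's real implementation; it only illustrates the documented rule of reading the env var named by `apiKeyEnv`, with `NVIDIA_API_KEY` as the default.

```javascript
// Hypothetical sketch of the documented key lookup: read the environment
// variable named by apiKeyEnv, defaulting to NVIDIA_API_KEY.
function resolveApiKey(reviewer, env = process.env) {
  const name = reviewer.apiKeyEnv || 'NVIDIA_API_KEY';
  return env[name] || null;
}

// Demo with a fake environment so no real secrets are involved.
const fakeEnv = { NVIDIA_API_KEY: 'nvapi-demo', OPENAI_API_KEY: 'sk-demo' };
const nvidiaKey = resolveApiKey({}, fakeEnv);
const openaiKey = resolveApiKey({ apiKeyEnv: 'OPENAI_API_KEY' }, fakeEnv);
```

Returning `null` for a missing variable is an assumption here; the point is only that each reviewer names its own key variable.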

````diff
@@ -59,10 +73,13 @@ prr review --changed --dry-run
 prr review --resume
 prr review --resume 2026-03-04T10-05-00-000Z
 prr review src/cli.js --dry-run --verbose
-prr guide coder
+prr brainstorm ./concept-brief.md
+prr brainstorm ./concept-brief.md --dry-run --verbose
+prr brainstorm ./concept-brief.md --no-synthesis
+prr brainstorm ./concept-brief.md --config .prrrc.brainstorm.js --json
 prr doctor
 prr doctor --request
-prr review examples/yai-timeout/yai-timeout.js --context-file examples/yai-timeout/review.instructions.md
+prr review examples/yai-timeout/yai-timeout.js --context-file ./review-context.md
 prr review --config .prrrc.js src --json
 prr experiment run src/**/*.js --preset smoke
 prr auto run --changed --json
````
````diff
@@ -103,14 +120,52 @@ module.exports = {
       provider: 'openai',
       endpoint: 'https://api.openai.com/v1',
       apiKeyEnv: 'OPENAI_API_KEY',
+      mode: 'defects',
       model: 'some/model',
-      prompt: 'Review this code with custom rules.',
+      prompt: 'Review this code for concrete bugs and risks with custom rules.',
       maxOutputTokens: 2048,
       useTools: true,
       maxToolRounds: 6,
       structuredOutputMode: 'json_schema'
+    },
+    {
+      name: 'Optional Brainstorm',
+      provider: 'openai',
+      endpoint: 'https://api.openai.com/v1',
+      apiKeyEnv: 'OPENAI_API_KEY',
+      mode: 'suggestions',
+      model: 'some/model',
+      prompt: 'Suggest at most 3 grounded follow-up improvements. Do not repeat defects. Include a clear benefit and tradeoff for each suggestion.',
+      useTools: true,
+      maxToolRounds: 4,
+      allowSuggestions: true,
+      maxSuggestions: 3,
+      structuredOutputMode: 'json_schema'
+    }
+  ],
+  brainstormers: [
+    {
+      name: 'Scope Challenger',
+      model: 'meta/llama-3.1-70b-instruct',
+      structuredOutputMode: 'json_object',
+      prompt: 'Challenge the concept scope and identify missing constraints.',
+      useTools: false
+    },
+    {
+      name: 'Validation Planner',
+      model: 'meta/llama-3.1-405b-instruct',
+      structuredOutputMode: 'json_object',
+      prompt: 'Turn the concept into validation work before implementation starts.',
+      useTools: false
     }
-  ]
+  ],
+  brainstormSynthesis: {
+    name: 'Core Coder',
+    model: 'meta/llama-3.1-405b-instruct',
+    structuredOutputMode: 'json_object',
+    prompt: 'Synthesize the brainstorm panel into a grounded recommendation and revised next brief.',
+    useTools: false
+  }
 };
 ```
````
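One plausible reading of the `maxSuggestions` cap used in the config above can be sketched as follows. `capSuggestions` is a hypothetical helper, not part of prr: it assumes surplus suggestions are simply trimmed while defect `findings` are left untouched.

```javascript
// Hypothetical illustration of the maxSuggestions cap on a structured
// reviewer result: trim extra suggestions, keep defect findings intact.
function capSuggestions(result, maxSuggestions) {
  if (!Array.isArray(result.suggestions) || maxSuggestions == null) {
    return result;
  }
  return { ...result, suggestions: result.suggestions.slice(0, maxSuggestions) };
}

const capped = capSuggestions(
  { findings: ['off-by-one in retry loop'], suggestions: ['a', 'b', 'c', 'd'] },
  3
);
```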

````diff
@@ -127,31 +182,63 @@ Configuration notes:
 - `timeoutMs`: provider request timeout in milliseconds
 - `structuredOutput`: set to `false` to force plain-text parsing even when the provider preset supports structured responses
 - `structuredOutputMode`: override with `json_schema` or `json_object` when the provider supports it
-- `--context-file`: inject a coder-prepared markdown briefing into the review request
+- `--context-file`: inject an optional markdown context file into the review request
 - `maxOutputTokens`: optional per-reviewer cap; omit it to let the provider decide
 - `useTools`: whether the reviewer may fetch file contents on demand
 - `maxToolRounds`: optional per-reviewer cap for tool-call rounds
+- `mode`: reviewer lane, either `defects` or `suggestions` (default `defects`)
+- `allowSuggestions`: when `true`, structured reviewers may return a separate `suggestions` array in addition to defect `findings` (`mode: 'suggestions'` turns this on automatically)
+- `maxSuggestions`: optional cap for reviewer suggestions when `allowSuggestions` is enabled
+- `brainstormers`: separate model panel for `prr brainstorm`, useful for broader or cheaper no-tools model fans
+- `brainstormSynthesis`: optional single-model synthesis stage that runs after `brainstormers` and produces a tighter recommendation plus a revised markdown next brief
 
 `reviewSharing` is only effective in `sequential` mode. In `parallel` mode, reviewers run concurrently and do not have prior results to inspect.
 When reviewers run with `useTools: false`, increase `contextMaxChars` if you need more inline source context for larger files.
+`mode: 'suggestions'` makes the reviewer an explicit improvement lane with suggestion-focused prompting and metadata. Structured output still gives the cleanest separation because it can return a dedicated `suggestions` array.
+Recommended pattern: keep normal reviewers in `mode: 'defects'`, then add a separate optional reviewer in `mode: 'suggestions'` with a low `maxSuggestions` cap.
+For GPT-5-family models, `maxOutputTokens` maps to `max_completion_tokens`, which includes reasoning tokens as well as visible output. If you set it too low, the model can spend the whole budget reasoning and return an empty visible response. Prefer leaving it unset or keeping it comfortably above the expected final output size.
 
 Reviewer transport overrides inherit from the global config by default, but each reviewer can override:
 - `provider`
 - `endpoint`
 - `apiKeyEnv`
 - `timeoutMs`
 - `structuredOutputMode`
+- `mode`
+- `allowSuggestions`
+- `maxSuggestions`
 
 That means one review run can mix free NVIDIA-hosted models with paid OpenAI-compatible backends.
+For brainstorming, it is often cleaner to keep a dedicated config such as `.prrrc.brainstorm.js` and pass it with `--config`.
+
+## Brainstorm Mode
+`prr brainstorm <brief.md>` runs a concept-review panel against a markdown brief instead of source files.
+
+- input is a markdown concept note, design draft, or implementation plan
+- models come from `brainstormers`, separate from normal `reviewers`
+- an optional `brainstormSynthesis` reviewer can consolidate the panel into a prioritized recommendation and revised markdown next brief
+- no file selection, diff parsing, or tool calls are required
+- this makes it practical to fan out across many cheaper NVIDIA-hosted models
+
+Typical flow:
+- draft `concept-brief.md`
+- run `prr brainstorm concept-brief.md`
+- review the optional synthesis output and merge the concrete findings back into the brief
+- re-run until the concept is tighter
+- start implementation and switch to normal `prr review`
 
 ## Output
 The default report is Markdown with:
 - timestamp
-- analyzed files and line counts
-- one section per reviewer
-- summary totals for findings, errors, and duration
+- one section per brainstormer
+- combined concept findings sections
+- optional synthesis section with priorities and a draft next brief
+- summary totals for brainstorm items, synthesis status, errors, and duration
 
 Use `--json` for machine-readable output suitable for automation.
+When synthesis is enabled, `nextBrief` is normalized as markdown text so it can be copied back into the source brief or saved directly for another brainstorm round.
+
+Brainstorm runs are persisted under `.prr/brainstorms/<run-id>/` with the same `request.json`, `progress.json`, per-reviewer results, and final `result.json` pattern as review runs.
 
 Each normal review run is persisted under `.prr/reviews/<run-id>/` with:
 - `request.json`
````
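The per-reviewer transport inheritance documented above can be sketched as a merge over the overridable keys. `mergeTransport` is illustrative only, not prr's real implementation; it assumes reviewer-level values win and global values fill the gaps.

```javascript
// Hypothetical sketch of the documented rule: a reviewer inherits global
// transport settings and may override any of the listed keys.
const OVERRIDABLE = [
  'provider', 'endpoint', 'apiKeyEnv', 'timeoutMs',
  'structuredOutputMode', 'mode', 'allowSuggestions', 'maxSuggestions'
];

function mergeTransport(globalConfig, reviewer) {
  const merged = { ...reviewer };
  for (const key of OVERRIDABLE) {
    if (merged[key] === undefined && globalConfig[key] !== undefined) {
      merged[key] = globalConfig[key]; // fill gaps from the global config
    }
  }
  return merged;
}

const merged = mergeTransport(
  { provider: 'nvidia-free', timeoutMs: 60000 },
  { name: 'Paid Lane', provider: 'openai' }
);
```

This is what lets one run mix a free NVIDIA-hosted default with a single paid OpenAI-backed reviewer.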
````diff
@@ -164,7 +251,7 @@ Use `--resume` to continue the latest incomplete review run, or `--resume <run-i
 Use `--dry-run` to inspect what would happen without calling the provider:
 - selected files
 - resolved config and execution mode
-- optional coder-prepared context file
+- optional markdown context file
 - context snippets that would be sent
 - reviewer prompts
 - actual batching plan
````
````diff
@@ -182,36 +269,25 @@ When a provider preset supports structured output, `prr` asks for machine-readab
 
 `prr` also builds a deterministic combined-findings view after each run. This deduplicates overlapping findings locally across reviewers before any optional checker/judge stage, so repeated reports do not need another model call just to collapse duplicates.
 
-For programmer-agent handoff, the repository also includes [prrrc.coder.guide.md](prrrc.coder.guide.md). It is a repo-local briefing file for tools like Claude or Codex: summarize changed files, call out missing context that reviewers would otherwise guess, and prepare a focused review task list before running `prr`.
-
-You can print it directly with:
+Use `--context-file` when the reviewer needs short factual context that is not obvious from the code or diff alone, for example intended behavior, constraints, or already-known tradeoffs.
 
-```bash
-prr guide coder
-```
-
-The expected workflow is:
-1. print the guide
-2. create a new `review.instructions.md`
-3. pass that file into `prr`
-
-And inject a prepared briefing directly into review requests:
+Example:
 
 ```bash
 prr review examples/yai-timeout/yai-timeout.js \
-  --context-file examples/yai-timeout/review.instructions.md
+  --context-file ./review-context.md
 ```
 
+A good context file should stay concise and focus on:
+- what changed or what to double-check
+- expected behavior or constraints that are easy to miss
+- intentional tradeoffs that should not be re-raised as defects
+
 Stop rule for review loops:
 - stop when no high-severity findings remain and two consecutive rounds add no materially new concrete defects
 - treat repeated low/info or policy-only findings as closure signal, not as mandatory code churn
 - record intentional tradeoffs and rejected findings before closing the loop
 
-Decision authority:
-- the core-programmer agent may declare a target "done" once the stop rule is satisfied
-- that declaration should include fix/reject rationale and remaining tradeoffs
-- the human operator can always request another round
-
 ## Context Strategy
 The default review path is diff-first. If the target files are inside a Git work tree, `prr` sends diff context first and lets the model request file contents or line ranges only when needed. This reduces prompt size and helps avoid truncating large reviews on smaller context-window models.
````
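A concrete instance of the three context-file bullets above can be built as a short string. The file name and every line here are hypothetical examples, not content shipped with the repository.

```javascript
// Hypothetical example of a concise --context-file briefing, following the
// documented shape: what changed, expected behavior, intentional tradeoffs.
const contextNote = [
  '# Review context',
  '',
  '- changed: retry handling around the request timeout path',
  '- expected: a timed-out call must reject, never resolve with partial data',
  '- intentional tradeoff: no retry jitter yet, do not re-raise as a defect'
].join('\n');
```

Writing this string to something like `review-context.md` and passing it with `--context-file` gives reviewers the facts they would otherwise have to guess.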

````diff
@@ -231,22 +307,23 @@ The repository includes a first real benchmark target under [examples/yai-timeou
 Useful commands:
 
 ```bash
-prr guide coder
 prr review examples/yai-timeout/yai-timeout.js --dry-run
 prr review examples/yai-timeout/yai-timeout.js
-prr review examples/yai-timeout/yai-timeout.js --context-file examples/yai-timeout/review.instructions.md
+prr review examples/yai-timeout/yai-timeout.js --context-file ./review-context.md
 prr experiment run examples/yai-timeout/yai-timeout.js --preset smoke
 ```
 
-The first live benchmark on `YaiTimeout` showed that a coder-prepared `review.instructions.md` improved review quality and reduced token waste compared with a plain run.
+Early live benchmarks on `YaiTimeout` showed that a short, focused context note improved review quality and reduced token waste compared with a plain run.
 
 The example is now considered closed for this repository cycle: no unresolved high-severity defects remain, and later rounds mostly repeated low-priority or speculative findings.
 
 ## Auto Mode
 `prr auto run` is the first proof-of-concept orchestration step. It currently:
 - resolves explicit files or Git-changed files
 - prefers the latest experiment recommendation when available
+- swaps tool-enabled recommendations to the verified elite list when the recommended model is not tool-verified
 - otherwise runs the configured reviewers
+- falls back to the top elite tool-capable reviewer when recommendation runs fail with connection-only errors
 - applies the local cleanup and quality scoring pass
 - emits a combined JSON or text summary
````
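The auto-mode swap rule added in this commit can be sketched in a few lines. `pickModel` and its inputs are illustrative names only, not prr's real API: the sketch assumes the documented behavior of keeping a recommendation when it is tool-verified and otherwise swapping to the top verified elite model.

```javascript
// Hypothetical sketch of the documented auto-mode swap: keep the experiment
// recommendation when it is on the verified elite tool-capable list,
// otherwise fall back to the top elite model.
function pickModel(recommended, eliteToolVerified) {
  if (recommended && eliteToolVerified.includes(recommended)) {
    return recommended;
  }
  return eliteToolVerified[0];
}

const elite = ['meta/llama-3.3-70b-instruct', 'meta/llama-3.1-405b-instruct'];
const kept = pickModel('meta/llama-3.1-405b-instruct', elite);
const swapped = pickModel('some/unverified-model', elite);
```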
