Commit a736c35

Feat: Implement Chat bot for Qualityfolio
1 parent 0a56d13 commit a736c35

32 files changed

Lines changed: 1829 additions & 0 deletions

sqlpage/sqlpage.db

Whitespace-only changes.
Lines changed: 4 additions & 0 deletions
OPENAI_API_KEY=sk-your-openai-key
GEMINI_API_KEY=AI-key
GROQ_API_KEY=gsk_key
ANTHROPIC_API_KEY=anthropic-key
Lines changed: 151 additions & 0 deletions
# QualityFolio Chat

A full-stack AI-powered chat application combining **SQLPage**, **LiteLLM**, and a **React-based Assistant UI**, designed to query a Resource Surveillance State Database (RSSD) using natural language.

## Overview

QualityFolio Chat allows users to ask natural language questions about quality data. It uses LiteLLM as an LLM proxy (supporting OpenAI-compatible models, including local Ollama models), SQLPage to serve a web UI from SQL, and a React chat widget for the frontend.

---

## Requirements

### System

| Requirement | Version / Notes |
|---|---|
| **Node.js** | v18+ |
| **Python** | 3.10+ |
| **npm** | v9+ |
| **SQLPage** | Latest (binary in PATH) |
| **Spry CLI** | Installed and in PATH |
| **Ollama** *(optional)* | Required if using local models (e.g. `oss-20b-32K:latest`) |

### Python Packages

Install via pip:

```bash
pip install 'litellm[proxy]'
```

Or, if using a virtual environment (recommended):

```bash
python -m venv litellm-venv
source litellm-venv/bin/activate
pip install 'litellm[proxy]'
```

### Node Packages (Frontend)

Installed automatically via `npm install` inside `assistant-ui-chat/`.

---

## Project Structure

```
qualityfolio-chat/
├── assistant-ui-chat/          # React frontend (Assistant UI)
│   └── ...
├── sqlpage/
│   └── sqlpage.js              # SQLPage configuration
├── dev-src.auto/               # Auto-generated SQLPage sources
├── litellm_config.yaml         # LiteLLM model & routing config
├── qualityfolio.md             # Spry source definition
├── chat-widget-react.js        # Compiled React chat widget
├── chat-widget-react-index.css
├── .env                        # Environment variables (API keys, etc.)
├── .env.example                # Example environment file
└── poly.sql                    # SQL definitions
```

---
## Setup & Running

Follow these steps **in order**. If the services run concurrently, use a separate terminal for each.

### Step 1 — Run Spry Commands

Generate the SQLPage sources from the markdown definition:

```bash
spry rb run qualityfolio.md
spry sp spc --fs dev-src.auto --destroy-first --conf sqlpage/sqlpage.js --md qualityfolio.md
```

### Step 2 — Start SQLPage

Serve the SQLPage web interface:

```bash
sqlpage
```

SQLPage will serve from the `dev-src.auto/` directory. Visit `http://localhost:9227` (or the configured port) in your browser.

### Step 3 — Start LiteLLM

Load environment variables and start the LiteLLM proxy:

```bash
source .env && litellm --config litellm_config.yaml
```

> **Note:** Ensure `.env` contains all required API keys or model endpoint URLs. See `.env.example` for reference.

### Step 4 — Start the Frontend

Install dependencies and run the React dev server:

```bash
cd assistant-ui-chat
npm install
npm run dev
```

The frontend will be available at `http://localhost:3000` (or as configured).
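The LiteLLM step above reads `litellm_config.yaml`, which is not shown in this commit excerpt. As a rough sketch only, a minimal config routing the `chat` alias (the value of `AI_MODEL` in `.env`) to a local Ollama model might look like the following; the model name and endpoint are assumptions based on the Requirements table:

```yaml
# litellm_config.yaml (sketch, not from this commit)
model_list:
  - model_name: chat              # alias the frontend selects via AI_MODEL
    litellm_params:
      model: ollama/oss-20b-32K:latest   # assumed local Ollama model
      api_base: http://localhost:11434   # default Ollama endpoint
```

Each `model_name` is the alias clients send in their OpenAI-compatible requests; `litellm_params.model` is the provider-qualified model LiteLLM actually calls.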
---

## Environment Variables

Copy `.env.example` to `.env` and fill in your values:

```bash
cp .env.example .env
```

Key variables to configure:

| Variable | Description |
|---|---|
| `OPENAI_API_KEY` | OpenAI API key (if using OpenAI models) |
| `OLLAMA_BASE_URL` | Ollama base URL (default: `http://localhost:11434`) |
| `DATABASE_URL` | Path or connection string for the RSSD database |
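Since a missing or empty variable only surfaces later as a confusing runtime error, it can help to check the environment up front. A minimal sketch, using the variable names from this project's `.env` files (the `missingVars` helper itself is hypothetical, not part of the commit):

```typescript
// Sketch: report which required environment variables are unset or blank.
function missingVars(
  env: Record<string, string | undefined>,
  required: string[],
): string[] {
  return required.filter((name) => !env[name]?.trim());
}

const required = ["LITELLM_BASE_URL", "LITELLM_API_KEY", "RSSD_PATH", "AI_MODEL"];

// Example: only the base URL is set, so the other three are reported missing.
const sampleEnv = { LITELLM_BASE_URL: "http://localhost:4000" };
console.log(missingVars(sampleEnv, required));
// → [ 'LITELLM_API_KEY', 'RSSD_PATH', 'AI_MODEL' ]
```

In a real app this check would run against `process.env` at startup and fail fast with a clear message.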
---

## Troubleshooting

### `UnboundLocalError: cannot access local variable 'completion_output'`

This is a known bug in some versions of LiteLLM when using tool-calling models with streaming. It is non-blocking but can be resolved by upgrading LiteLLM:

```bash
pip install --upgrade 'litellm[proxy]'
```

### LiteLLM: "upstream model provider is currently experiencing high demand"

This is a transient error from the model provider. Wait a moment and retry, or switch to a different model in `litellm_config.yaml`.

### SQLPage not serving updated files

Re-run Steps 1 and 2 to regenerate `dev-src.auto/`, then restart SQLPage.

### Frontend not connecting to chat API

Ensure the LiteLLM proxy is running and that the API endpoint in `assistant-ui-chat` matches the LiteLLM proxy address (typically `http://localhost:4000`).
Lines changed: 10 additions & 0 deletions
## LiteLLM gateway
LITELLM_BASE_URL=http://localhost:4000
LITELLM_API_KEY=sk-key
RSSD_PATH=../resource-surveillance.sqlite.db

# Default model alias — must match a model_name in litellm_config.yaml
AI_MODEL=chat
NEXT_PUBLIC_SQLPAGE_BASE_URL=http://localhost:8080/
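The `NEXT_PUBLIC_` prefix makes the SQLPage base URL visible to browser-side Next.js code. A small sketch of how the frontend might build SQLPage links from it (the page name `index.sql` is hypothetical, not taken from this commit):

```typescript
// Sketch: resolve a SQLPage page path against the configured base URL.
const base = process.env.NEXT_PUBLIC_SQLPAGE_BASE_URL ?? "http://localhost:8080/";
const pageUrl = new URL("index.sql", base).toString();
console.log(pageUrl); // with the default base: http://localhost:8080/index.sql
```

Using the `URL` constructor rather than string concatenation avoids double or missing slashes when the base value does or does not end with `/`.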
Lines changed: 195 additions & 0 deletions
import {
  streamText,
  convertToModelMessages,
  stepCountIs,
  createUIMessageStream,
} from "ai";
import { createMCPClient } from "@ai-sdk/mcp";
import { StdioClientTransport } from "@modelcontextprotocol/sdk/client/stdio.js";
import { createOpenAICompatible } from "@ai-sdk/openai-compatible";

export const maxDuration = 60;

let cachedTableNames: string[] | null = null;

async function getKnownTables(
  mcpTools: Record<string, { execute?: Function }>,
): Promise<string[]> {
  if (cachedTableNames) return cachedTableNames;

  const querySqlTool = mcpTools.query_sql;
  if (!querySqlTool?.execute) return [];

  try {
    const result = await querySqlTool.execute(
      {
        sql: "SELECT name FROM sqlite_master WHERE type IN ('table', 'view') AND name NOT LIKE 'sqlite_%' ORDER BY name",
        limit: 200,
      },
      {
        toolCallId: "known-tables-cache",
        messages: [],
      },
    );

    const textContent = (
      result?.content as Array<{ type?: string; text?: string }> | undefined
    )?.find((entry) => entry.type === "text")?.text;

    if (!textContent) return [];

    const parsed = JSON.parse(textContent) as {
      rows?: Array<{ name?: string }>;
    };

    cachedTableNames =
      parsed.rows
        ?.map((row) => row.name)
        .filter((name): name is string => Boolean(name)) ?? [];

    return cachedTableNames;
  } catch {
    return [];
  }
}

const open_model = createOpenAICompatible({
  baseURL: process.env.LITELLM_BASE_URL!,
  name: process.env.AI_MODEL!,
  apiKey: process.env.LITELLM_API_KEY!,
});

const mcpClient = await createMCPClient({
  transport: new StdioClientTransport({
    command: "surveilr",
    args: ["mcp", "server", "-d", process.env.RSSD_PATH!],
  }),
});

const tools = await mcpClient.tools();

console.log(
  "---------------------------------TOOLS---------------------------------------",
);
console.log(tools);
console.log(
  "-----------------------------------------------------------------------------",
);

export async function POST(req: Request) {
  try {
    const { messages, model } = await req.json();

    if (!messages || !Array.isArray(messages)) {
      return new Response("Invalid messages", { status: 400 });
    }

    const knownTables = await getKnownTables(
      tools as Record<string, { execute?: Function }>,
    );

    const tableHint = knownTables.length
      ? `\n\nAvailable tables and views in the RSSD (use exact names, do not guess pluralizations or variations):\n${knownTables.join(", ")}.`
      : "";

    const systemPrompt = `You are an AI assistant connected to a surveilr Resource Surveillance State Database (RSSD) via an MCP server. Your primary capability is answering questions by generating and executing SQL queries against the RSSD — a read-only SQLite database.

Use a "Progressive Discovery" strategy: start with lightweight tools and escalate only when needed. You have a maximum of 15 tool calls per response — use them efficiently.

Core Constraints:
- Read-only: Only SELECT statements are permitted. Never attempt INSERT, UPDATE, DELETE, DROP, or any DDL.
- Row limits: Queries return 10 rows by default, max 50 rows. Request more explicitly only when truly necessary.
- Text truncation: All text fields are truncated at 200 characters. If a value ends with "... (N chars total)", the full value is longer than displayed.
- Step budget: You have at most 15 tool calls per response. Prefer the minimum number of calls needed.

Available MCP Tools:
1. Schema Discovery (use these FIRST):
- list_tables(): ~50-100 tokens. Use at the start of a new conversation to see what tables exist.
- get_table_columns(table_name): ~50-200 tokens. Use once you know which tables are relevant.
- get_table_metadata(table_name): Detailed column definitions for a specific table.
- get_schema_compact(): ~2k-5k tokens. Use when you need a broad overview of the full database structure.
- get_schema(): ~25k-80k tokens. Use only when full metadata and row counts are explicitly required.

2. Data Sampling:
- get_table_sample(table_name): Returns first 3 rows from a table; text fields truncated to 200 chars.
- get_table_stats(table_name): Get row count and basic stats for a table.

3. Query Execution:
- query_sql(sql, limit?): Execute a SELECT query. Default 10 rows, max 50 rows.

4. Ontology Tools:
- query_ontology(concept): Look up a concept in the RSSD ontology.
- explore_concept(class_name): Explore relationships connected to an ontology class.
- list_ontology(): List available ontology classes.

Optimal Text-to-SQL Workflow:
1. MAP: Call \`list_tables()\` first (only if you don't already know the schema from this conversation) to identify candidate tables.
2. DRILL: Call \`get_table_columns(table_name)\` for only 1-2 tables that look relevant to the user's question.
3. INSPECT: Call \`get_table_sample(table_name)\` to see example values (text is truncated for efficiency).
4. QUERY: Use \`query_sql\` with narrow SELECT statements and specific WHERE clauses.

- If a user asks for "passed tests," look for QualityFolio (QF) or evidence tables in the schema.
- Always prefer small, targeted tool calls over broad discovery.
- When a query returns no results, try relaxing WHERE filters or checking column values via \`get_table_sample\` before concluding the data doesn't exist.

Analysis & Recommendations:
- After retrieving data, ALWAYS provide analysis and actionable recommendations when the user asks for insights, improvements, or recommendations.
- When asked about improving test pass rates: query relevant test result data, identify failing patterns, and suggest concrete improvement steps based on the data found.
- When asked about trends: compare data across time, test suites, or categories and highlight notable patterns.
- When asked for recommendations: base them on actual data retrieved from the RSSD and supplement with testing best practices.
- Never refuse to provide recommendations simply because you are a database tool — you are an AI analyst that uses the database as your data source.
- If the data is insufficient to give a full recommendation, state what data was found and what additional data would help.

Behavioral Rules:
1. Always start with list_tables() on the FIRST turn of a conversation. On subsequent turns, reuse schema already discovered — do not re-run list_tables() or get_table_columns() for already-inspected tables.
2. Never call get_schema() unless the user explicitly asks for full schema metadata. It is expensive (25k-80k tokens).
3. Chain tools efficiently: list_tables -> get_table_columns -> query_sql is the default happy path.
4. Validate before querying: Confirm table and column names exist via discovery tools before writing SQL. Do not guess column names.
5. Explain truncation: If a text result ends with "... (N chars total)", inform the user the value was truncated and offer to query with a targeted filter.
6. Limit discipline: Default to limit=10. Only increase to max 50 if the user explicitly needs more data.
7. SQL safety: Never generate or execute non-SELECT SQL. If the user asks to modify data, explain that the MCP server is read-only.
8. Surface ontology when relevant: If the user's question involves concepts, classifications, or taxonomy, consider list_ontology() or query_ontology() before writing SQL.
9. Empty results: If a query returns no rows, inform the user, suggest possible reasons (wrong filter value, different column name), and offer a follow-up query to verify.
10. Silent execution: Never narrate tool calls, discovery steps, or intermediate findings in the response. Only output the final answer.

Anti-Patterns to Avoid:
- Calling get_schema() on the first turn "just to be safe".
- Guessing column names without calling get_table_columns() first.
- Requesting limit=50 when the user only asked for a summary.
- Re-running list_tables() or get_table_columns() for tables already inspected in this conversation.
- Treating truncated text values as the full value.
- Writing JOINs without first confirming the join key columns exist in both tables.${tableHint}`;

    const result = streamText({
      model: open_model(process.env.AI_MODEL!),
      tools: tools,
      messages: await convertToModelMessages(messages),
      system: systemPrompt,
      stopWhen: stepCountIs(15),
      onStepFinish: async ({ toolResults }) => {
        if (toolResults.length) {
          console.log(JSON.stringify(toolResults, null, 2));
        }
      },
    });

    return result.toUIMessageStreamResponse({
      onError: (err) => {
        console.error("STREAM ERROR:", err);
        return err instanceof Error
          ? err.message
          : "An error occurred while processing your request.";
      },
    });
  } catch (err) {
    console.error("API ERROR:", err);
    const errorMessage =
      err instanceof Error ? err.message : "An unexpected server error occurred.";
    const stream = createUIMessageStream({
      execute: ({ writer }) => {
        writer.write({
          type: "error",
          errorText: errorMessage,
        });
      },
    });
    return new Response(stream, {
      status: 200,
      headers: { "Content-Type": "text/plain; charset=utf-8" },
    });
  }
}
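The trickiest part of `getKnownTables` above is unwrapping the MCP tool result: find the first `text` content entry, parse its JSON payload, and keep only well-formed row names. That logic can be exercised in isolation; the sketch below extracts it into a standalone function (the table names in the sample are hypothetical):

```typescript
// Standalone sketch of the parsing done in getKnownTables: pull the first
// "text" entry out of an MCP tool result and read table names from its JSON.
type McpContent = { type?: string; text?: string };

function parseTableNames(content: McpContent[] | undefined): string[] {
  const text = content?.find((entry) => entry.type === "text")?.text;
  if (!text) return [];
  try {
    const parsed = JSON.parse(text) as { rows?: Array<{ name?: string }> };
    return (
      parsed.rows
        ?.map((row) => row.name)
        .filter((name): name is string => Boolean(name)) ?? []
    );
  } catch {
    // Malformed JSON degrades to "no known tables" rather than throwing.
    return [];
  }
}

// Example shaped like a query_sql result for the sqlite_master query:
const sample: McpContent[] = [
  {
    type: "text",
    text: JSON.stringify({ rows: [{ name: "test_case" }, { name: "test_run" }] }),
  },
];
console.log(parseTableNames(sample)); // [ 'test_case', 'test_run' ]
```

Isolating the parser this way makes the failure modes (no text entry, invalid JSON, missing `rows`) easy to test without spawning the MCP server.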
