diff --git a/src/orchestrator/batch.ts b/src/orchestrator/batch.ts
index 239c6ae..5febfdd 100644
--- a/src/orchestrator/batch.ts
+++ b/src/orchestrator/batch.ts
@@ -35,6 +35,7 @@ export interface CompareOptions {
   judgeModel: string
   answeringModel: string
   sampling?: SamplingConfig
+  questionIds?: string[]
   force?: boolean
 }
 
@@ -146,7 +147,7 @@ export class BatchManager {
   }
 
   async createManifest(options: CompareOptions): Promise<CompareManifest> {
-    const { providers, benchmark, judgeModel, answeringModel, sampling } = options
+    const { providers, benchmark, judgeModel, answeringModel, sampling, questionIds } = options
     const compareId = generateCompareId()
 
     logger.info(`Loading benchmark: ${benchmark}`)
@@ -155,7 +156,37 @@ export class BatchManager {
     const allQuestions = benchmarkInstance.getQuestions()
 
     let targetQuestionIds: string[]
-    if (sampling) {
+    if (questionIds && questionIds.length > 0) {
+      // Explicit IDs take precedence over sampling. De-duplicate them first (keeping
+      // first-occurrence order) so a repeated ID yields a single target entry, then
+      // split them by whether the benchmark actually contains the ID.
+      // NOTE(review): questionIds is assumed to be a string[] here; no runtime type
+      // check is performed in this block.
+      const allQuestionIdsSet = new Set(allQuestions.map((q) => q.questionId))
+      const uniqueIds = Array.from(new Set(questionIds))
+      const validIds = uniqueIds.filter((id) => allQuestionIdsSet.has(id))
+      const invalidIds = uniqueIds.filter((id) => !allQuestionIdsSet.has(id))
+
+      // Unknown IDs are logged and dropped rather than failing the whole request...
+      if (invalidIds.length > 0) {
+        logger.warn(`Invalid question IDs (will be skipped): ${invalidIds.join(", ")}`)
+      }
+
+      // ...unless no valid ID remains, in which case there is nothing to run.
+      if (validIds.length === 0) {
+        throw new Error(
+          `All provided questionIds are invalid. No matching questions found in benchmark "${benchmark}". ` +
+            `Invalid IDs: ${invalidIds.join(", ")}`
+        )
+      }
+
+      // Counts logged below refer to unique IDs, since duplicates were collapsed above.
+      targetQuestionIds = validIds
+      logger.info(
+        `Using explicit questionIds: ${validIds.length} valid questions` +
+          (invalidIds.length > 0 ? ` (${invalidIds.length} invalid skipped)` : "")
+      )
+    } else if (sampling) {
       targetQuestionIds = selectQuestionsBySampling(allQuestions, sampling)
     } else {
       targetQuestionIds = allQuestions.map((q) => q.questionId)
diff --git a/src/orchestrator/index.ts b/src/orchestrator/index.ts
index 64578bb..f19123b 100644
--- a/src/orchestrator/index.ts
+++ b/src/orchestrator/index.ts
@@ -213,8 +213,35 @@ export class Orchestrator {
       effectiveLimit = limit
 
       if (questionIds && questionIds.length > 0) {
-        logger.info(`Using explicit questionIds: ${questionIds.length} questions`)
-        targetQuestionIds = questionIds
+        // Explicit IDs take precedence over sampling. De-duplicate them first (keeping
+        // first-occurrence order) so a repeated ID yields a single target entry, then
+        // split them by whether the benchmark actually contains the ID.
+        // NOTE(review): questionIds is assumed to be a string[] here; no runtime type
+        // check is performed in this block.
+        const allQuestionIdsSet = new Set(allQuestions.map((q) => q.questionId))
+        const uniqueIds = Array.from(new Set(questionIds))
+        const validIds = uniqueIds.filter((id) => allQuestionIdsSet.has(id))
+        const invalidIds = uniqueIds.filter((id) => !allQuestionIdsSet.has(id))
+
+        // Unknown IDs are logged and dropped rather than failing the whole run...
+        if (invalidIds.length > 0) {
+          logger.warn(`Invalid question IDs (will be skipped): ${invalidIds.join(", ")}`)
+        }
+
+        // ...unless no valid ID remains, in which case there is nothing to run.
+        if (validIds.length === 0) {
+          throw new Error(
+            `All provided questionIds are invalid. No matching questions found in benchmark "${benchmarkName}". ` +
+              `Invalid IDs: ${invalidIds.join(", ")}`
+          )
+        }
+
+        // Counts logged below refer to unique IDs, since duplicates were collapsed above.
+        targetQuestionIds = validIds
+        logger.info(
+          `Using explicit questionIds: ${validIds.length} valid questions` +
+            (invalidIds.length > 0 ? ` (${invalidIds.length} invalid skipped)` : "")
+        )
       } else if (sampling) {
         logger.info(`Using sampling mode: ${sampling.mode}`)
         targetQuestionIds = selectQuestionsBySampling(allQuestions, sampling)
diff --git a/src/server/routes/benchmarks.ts b/src/server/routes/benchmarks.ts
index af0b377..6860315 100644
--- a/src/server/routes/benchmarks.ts
+++ b/src/server/routes/benchmarks.ts
@@ -128,6 +128,75 @@ export async function handleBenchmarksRoutes(req: Request, url: URL): Promise<Re
     }
   }
 
+  // POST /api/benchmarks/:name/expand-ids - Expand conversation/session patterns to question IDs
+  // Body: { patterns: string[] }. Responds with { expandedIds, patternResults }, where
+  // patternResults maps each non-blank pattern (as sent) to the question IDs it produced.
+  const expandIdsMatch = pathname.match(/^\/api\/benchmarks\/([^/]+)\/expand-ids$/)
+  if (method === "POST" && expandIdsMatch) {
+    const benchmarkName = expandIdsMatch[1]
+
+    try {
+      const body = await req.json()
+      const { patterns } = body as { patterns: string[] }
+
+      if (!patterns || !Array.isArray(patterns)) {
+        return json({ error: "patterns array is required" }, 400)
+      }
+      // The cast above is unchecked: reject non-string entries here so the client gets a
+      // clear message instead of a TypeError from pattern.trim() in the loop below.
+      if (patterns.some((p) => typeof p !== "string")) {
+        return json({ error: "patterns must be an array of strings" }, 400)
+      }
+
+      const benchmark = createBenchmark(benchmarkName as any)
+      await benchmark.load()
+      const allQuestions = benchmark.getQuestions()
+      const knownQuestionIds = new Set(allQuestions.map((q) => q.questionId))
+
+      const expandedIds = new Set<string>()
+      const patternResults: Record<string, string[]> = {}
+
+      for (const pattern of patterns) {
+        const trimmed = pattern.trim()
+        if (!trimmed) continue
+
+        let expanded: string[] = []
+        // Pattern 1: Conversation ID (e.g., "conv-26") - all questions whose ID starts
+        // with "<conversation>-q".
+        if (/^[a-zA-Z]+-\d+$/.test(trimmed)) {
+          const prefix = trimmed + "-q"
+          expanded = allQuestions
+            .filter((q) => q.questionId.startsWith(prefix))
+            .map((q) => q.questionId)
+        }
+        // Pattern 2: Session ID (e.g., "conv-26-session_1" or "001be529-session-0") -
+        // all questions whose haystackSessionIds include it.
+        else if (trimmed.includes("-session")) {
+          expanded = allQuestions
+            .filter((q) => q.haystackSessionIds.includes(trimmed))
+            .map((q) => q.questionId)
+        }
+
+        // Pattern 3: Direct question ID. Also the fallback when a pattern-shaped input
+        // expanded to nothing, so a real question ID such as "abc-12" is not rejected
+        // merely because it looks like a conversation or session ID.
+        if (expanded.length === 0 && knownQuestionIds.has(trimmed)) {
+          expanded = [trimmed]
+        }
+
+        for (const id of expanded) expandedIds.add(id)
+        patternResults[pattern] = expanded
+      }
+
+      return json({
+        expandedIds: Array.from(expandedIds),
+        patternResults,
+      })
+    } catch (e) {
+      return json({ error: e instanceof Error ? e.message : "Failed to expand IDs" }, 400)
+    }
+  }
+
   // GET /api/models - List available models
   if (method === "GET" && pathname === "/api/models") {
     const openai = listModelsByProvider("openai").map((alias) => ({
diff --git a/src/server/routes/compare.ts b/src/server/routes/compare.ts
index c31589f..7c81f75 100644
--- a/src/server/routes/compare.ts
+++ b/src/server/routes/compare.ts
@@ -146,7 +146,8 @@ export async function handleCompareRoutes(req: Request, url: URL): Promise<Respo
   if (method === "POST" && pathname === "/api/compare/start") {
     try {
       const body = await req.json()
-      const { providers, benchmark, judgeModel, answeringModel, sampling, force } = body
+      const { providers, benchmark, judgeModel, answeringModel, sampling, questionIds, force } =
+        body
 
       if (!providers || !Array.isArray(providers) || providers.length === 0) {
         return json({ error: "Missing or invalid providers array" }, 400)
@@ -165,6 +166,7 @@ export async function handleCompareRoutes(req: Request, url: URL): Promise<Respo
         judgeModel,
         answeringModel,
         sampling,
+        questionIds,
         force,
       })
 
@@ -387,6 +389,7 @@ async function initializeComparison(options: {
   judgeModel: string
   answeringModel: string
   sampling?: SamplingConfig
+  questionIds?: string[]
   force?: boolean
 }): Promise<{ compareId: string }> {
   // Only await manifest creation - this is fast
diff --git a/src/server/routes/runs.ts b/src/server/routes/runs.ts
index 1aaab7b..5002cfd 100644
--- a/src/server/routes/runs.ts
+++ b/src/server/routes/runs.ts
@@ -190,12 +190,14 @@ export async function handleRunsRoutes(req: Request, url: URL): Promise<Response
         answeringModel,
         limit,
         sampling,
+        questionIds,
         concurrency,
         force,
         fromPhase,
         sourceRunId,
       } = body
       console.log("[API] Extracted sampling:", sampling)
+      console.log("[API] Extracted questionIds:", questionIds)
       console.log("[API] Extracted concurrency:", concurrency)
 
       if (!provider || !benchmark || !runId || !judgeModel) {
@@ -279,6 +281,7 @@ export async function handleRunsRoutes(req: Request, url: URL): Promise<Response
         answeringModel,
         limit,
         sampling,
+        questionIds,
         concurrency,
         force: sourceRunId ? false : force,
         fromPhase: fromPhase as PhaseId | undefined,
@@ -374,6 +377,7 @@ async function runBenchmark(options: {
   answeringModel?: string
   limit?: number
   sampling?: SamplingConfig
+  questionIds?: string[]
   concurrency?: ConcurrencyConfig
   force?: boolean
   fromPhase?: PhaseId
@@ -396,6 +400,7 @@ async function runBenchmark(options: {
       answeringModel: options.answeringModel,
       limit: options.limit,
       sampling: options.sampling,
+      questionIds: options.questionIds,
       concurrency: options.concurrency,
       force: options.force,
       phases,
diff --git a/ui/app/compare/new/page.tsx b/ui/app/compare/new/page.tsx
index a9f3d86..e095b84 100644
--- a/ui/app/compare/new/page.tsx
+++ b/ui/app/compare/new/page.tsx
@@ -8,6 +8,8 @@ import {
   getBenchmarks,
   getModels,
   startCompare,
+  expandQuestionIdPatterns,
+  getBenchmarkQuestions,
   type SelectionMode,
   type SampleType,
   type SamplingConfig,
@@ -35,9 +37,18 @@ export default function NewComparePage() {
     sampleType: "consecutive" as SampleType,
     perCategory: "2",
     limit: "",
+    questionIds: "",
   })
 
   const [editingCompareId, setEditingCompareId] = useState(false)
+  const [validatingQuestionIds, setValidatingQuestionIds] = useState(false)
+  const [questionIdValidation, setQuestionIdValidation] = useState<{
+    valid: string[]
+    invalid: string[]
+    total: number
+    expanded: string[]
+    patternResults: Record<string, string[]>
+  } | null>(null)
   const compareIdInputRef = useRef<HTMLInputElement>(null)
 
   useEffect(() => {
@@ -72,6 +83,70 @@ export default function NewComparePage() {
     }
   }
 
+  /**
+   * Expands comma-separated patterns through the expand-ids endpoint, then cross-checks each
+   * expanded ID against the benchmark's question list (fetched 100 per page).
+   *
+   * In the result, `invalid` lists expanded IDs absent from the question list followed by
+   * patterns that expanded to nothing, `total` counts the unique patterns submitted, and
+   * `expanded` is the raw expansion (returned even when some entries are invalid).
+   */
+  async function validateQuestionIds(
+    benchmark: string,
+    questionIdsInput: string
+  ): Promise<{
+    valid: string[]
+    invalid: string[]
+    total: number
+    expanded: string[]
+    patternResults: Record<string, string[]>
+  }> {
+    // Tokenize on commas, discard blank tokens, and collapse repeats.
+    const tokens = questionIdsInput.split(",").map((token) => token.trim())
+    const uniquePatterns = Array.from(new Set(tokens.filter((token) => token !== "")))
+
+    // Ask the expand-ids API to turn the patterns into concrete question IDs.
+    const { expandedIds, patternResults } = await expandQuestionIdPatterns(
+      benchmark,
+      uniquePatterns
+    )
+
+    // Collect every question ID the benchmark exposes, one page at a time.
+    const knownIds = new Set<string>()
+    let page = 0
+    let lastPage: number
+    do {
+      page += 1
+      const { questions, pagination } = await getBenchmarkQuestions(benchmark, {
+        page,
+        limit: 100,
+      })
+      for (const question of questions) {
+        knownIds.add(question.questionId)
+      }
+      lastPage = pagination.totalPages
+    } while (page < lastPage)
+
+    // Partition the expanded IDs, preserving the order they were returned in.
+    const valid = expandedIds.filter((id) => knownIds.has(id))
+    const missing = expandedIds.filter((id) => !knownIds.has(id))
+
+    // A pattern with no entry (or an empty entry) in patternResults matched nothing.
+    const unmatchedPatterns = uniquePatterns.filter((pattern) => {
+      const hits = patternResults[pattern]
+      return !hits || hits.length === 0
+    })
+
+    // Missing IDs come first, then the patterns that produced no matches.
+    return {
+      valid,
+      invalid: [...missing, ...unmatchedPatterns],
+      total: uniquePatterns.length,
+      expanded: expandedIds,
+      patternResults,
+    }
+  }
+
   function generateCompareId() {
     const now = new Date()
     const date = now.toISOString().slice(0, 10).replace(/-/g, "")
@@ -93,6 +168,7 @@ export default function NewComparePage() {
     const compareId = form.compareId || generateCompareId()
 
     let sampling: SamplingConfig | undefined
+    let questionIds: string[] | undefined
     if (form.selectionMode === "full") {
       sampling = { mode: "full" }
     } else if (form.selectionMode === "sample") {
@@ -107,6 +183,20 @@ export default function NewComparePage() {
         mode: "limit",
         limit: parseInt(form.limit),
       }
+    } else if (form.selectionMode === "questionIds") {
+      if (!form.questionIds.trim()) {
+        setError("Please enter at least one pattern or question ID")
+        return
+      }
+
+      // Require validation before submission (MANDATORY)
+      if (!questionIdValidation || questionIdValidation.invalid.length > 0) {
+        setError("Please validate patterns before starting the comparison")
+        return
+      }
+
+      // Use the expanded question IDs from validation
+      questionIds = questionIdValidation.expanded
     }
 
     try {
@@ -120,6 +210,7 @@ export default function NewComparePage() {
         judgeModel: form.judgeModel,
         answeringModel: form.answeringModel,
         sampling,
+        questionIds,
       })
 
       router.push(`/compare`)
@@ -273,14 +364,22 @@ export default function NewComparePage() {
             Question Selection
           </label>
           <div className="flex gap-0 mb-4">
-            {(["full", "sample", "limit"] as SelectionMode[]).map((mode) => {
+            {(["full", "sample", "limit", "questionIds"] as SelectionMode[]).map((mode) => {
               const isSelected = form.selectionMode === mode
-              const labels = { full: "Full", sample: "Sample", limit: "Limit" }
+              const labels = {
+                full: "Full",
+                sample: "Sample",
+                limit: "Limit",
+                questionIds: "IDs",
+              }
               return (
                 <button
                   key={mode}
                   type="button"
-                  onClick={() => setForm({ ...form, selectionMode: mode })}
+                  onClick={() => {
+                    setForm({ ...form, selectionMode: mode })
+                    setQuestionIdValidation(null)
+                  }}
                   className="px-3 py-1.5 text-sm font-medium transition-colors border-t border-b border-r first:border-l first:rounded-l last:rounded-r"
                   style={{
                     fontFamily: "'Space Grotesk', sans-serif",
@@ -343,6 +442,100 @@ export default function NewComparePage() {
               />
             </div>
           )}
+
+          {form.selectionMode === "questionIds" && (
+            <div className="space-y-3">
+              <div>
+                <label className="block text-sm text-text-secondary mb-2">
+                  Question IDs (comma-separated)
+                </label>
+                <textarea
+                  className="w-full px-3 py-2 text-sm bg-[#222222] border border-[#444444] rounded text-text-primary placeholder-text-muted focus:outline-none focus:border-accent font-mono"
+                  rows={4}
+                  value={form.questionIds}
+                  onChange={(e) => {
+                    setForm({ ...form, questionIds: e.target.value })
+                    setQuestionIdValidation(null)
+                  }}
+                  placeholder="e.g., conv-30, conv-30-q0, conv-30-session_1"
+                />
+                <p className="text-xs text-text-muted mt-1">
+                  Enter question IDs, conversation IDs (e.g., conv-26), or session IDs (e.g.,
+                  conv-26-session_1), separated by commas
+                </p>
+              </div>
+
+              {/* Validation Button */}
+              <button
+                type="button"
+                onClick={async () => {
+                  if (!form.questionIds.trim()) {
+                    setError("Please enter at least one question ID")
+                    return
+                  }
+                  if (!form.benchmark) {
+                    setError("Please select a benchmark first")
+                    return
+                  }
+
+                  setValidatingQuestionIds(true)
+                  setError(null)
+                  try {
+                    const validation = await validateQuestionIds(form.benchmark, form.questionIds)
+                    setQuestionIdValidation(validation)
+
+                    if (validation.invalid.length > 0) {
+                      setError(`Invalid question IDs: ${validation.invalid.join(", ")}`)
+                    }
+                  } catch (e) {
+                    setError(e instanceof Error ? e.message : "Failed to validate question IDs")
+                  } finally {
+                    setValidatingQuestionIds(false)
+                  }
+                }}
+                disabled={validatingQuestionIds || !form.benchmark || !form.questionIds.trim()}
+                className="px-3 py-1.5 text-sm bg-[#222222] border border-[#444444] rounded text-text-primary hover:border-accent disabled:opacity-50 disabled:cursor-not-allowed transition-colors"
+              >
+                {validatingQuestionIds ? (
+                  <>
+                    <div className="inline-block w-3 h-3 border-2 border-accent border-t-transparent rounded-full animate-spin mr-2" />
+                    Validating...
+                  </>
+                ) : (
+                  "Validate Question IDs"
+                )}
+              </button>
+
+              {/* Validation Result */}
+              {questionIdValidation && (
+                <div
+                  className={`p-3 rounded text-sm border ${
+                    questionIdValidation.invalid.length === 0
+                      ? "bg-green-500/10 border-green-500/20 text-green-400"
+                      : "bg-yellow-500/10 border-yellow-500/20 text-yellow-400"
+                  }`}
+                >
+                  <div className="font-medium mb-1">
+                    {questionIdValidation.invalid.length === 0
+                      ? `✓ Valid: ${questionIdValidation.total} patterns expanded to ${questionIdValidation.expanded.length} questions`
+                      : `⚠ ${questionIdValidation.valid.length} valid, ${questionIdValidation.invalid.length} invalid patterns`}
+                  </div>
+                  {questionIdValidation.invalid.length > 0 && (
+                    <div className="text-xs mt-1">
+                      Invalid: {questionIdValidation.invalid.join(", ")}
+                    </div>
+                  )}
+                  {questionIdValidation.expanded.length > 0 && (
+                    <div className="text-xs mt-2 opacity-80">
+                      Sample expanded IDs: {questionIdValidation.expanded.slice(0, 5).join(", ")}
+                      {questionIdValidation.expanded.length > 5 &&
+                        ` ...and ${questionIdValidation.expanded.length - 5} more`}
+                    </div>
+                  )}
+                </div>
+              )}
+            </div>
+          )}
         </div>
 
         {error && (
diff --git a/ui/app/runs/new/page.tsx b/ui/app/runs/new/page.tsx
index ae3b222..5087962 100644
--- a/ui/app/runs/new/page.tsx
+++ b/ui/app/runs/new/page.tsx
@@ -9,6 +9,8 @@ import {
   getModels,
   startRun,
   getCompletedRuns,
+  expandQuestionIdPatterns,
+  getBenchmarkQuestions,
   type RunSummary,
   type PhaseId,
   PHASE_ORDER,
@@ -43,6 +45,7 @@ export default function NewRunPage() {
     sampleType: "consecutive" as SampleType,
     perCategory: "2",
     limit: "",
+    questionIds: "",
     concurrency: {
       default: undefined as number | undefined,
       ingest: undefined as number | undefined,
@@ -67,6 +70,14 @@ export default function NewRunPage() {
   const [showAdvancedConcurrencyNew, setShowAdvancedConcurrencyNew] = useState(false)
   const [showAdvancedConcurrencyAdvanced, setShowAdvancedConcurrencyAdvanced] = useState(false)
   const [editingPhase, setEditingPhase] = useState<string | null>(null)
+  const [validatingQuestionIds, setValidatingQuestionIds] = useState(false)
+  const [questionIdValidation, setQuestionIdValidation] = useState<{
+    valid: string[]
+    invalid: string[]
+    total: number
+    expanded: string[]
+    patternResults: Record<string, string[]>
+  } | null>(null)
   const runIdInputRef = useRef<HTMLInputElement>(null)
   const advancedRunIdInputRef = useRef<HTMLInputElement>(null)
   const concurrencyInputRef = useRef<HTMLInputElement>(null)
@@ -212,6 +223,70 @@ export default function NewRunPage() {
     }
   }
 
+  /**
+   * Expands comma-separated patterns through the expand-ids endpoint, then cross-checks each
+   * expanded ID against the benchmark's question list (fetched 100 per page).
+   *
+   * In the result, `invalid` lists expanded IDs absent from the question list followed by
+   * patterns that expanded to nothing, `total` counts the unique patterns submitted, and
+   * `expanded` is the raw expansion (returned even when some entries are invalid).
+   */
+  async function validateQuestionIds(
+    benchmark: string,
+    questionIdsInput: string
+  ): Promise<{
+    valid: string[]
+    invalid: string[]
+    total: number
+    expanded: string[]
+    patternResults: Record<string, string[]>
+  }> {
+    // Tokenize on commas, discard blank tokens, and collapse repeats.
+    const tokens = questionIdsInput.split(",").map((token) => token.trim())
+    const uniquePatterns = Array.from(new Set(tokens.filter((token) => token !== "")))
+
+    // Ask the expand-ids API to turn the patterns into concrete question IDs.
+    const { expandedIds, patternResults } = await expandQuestionIdPatterns(
+      benchmark,
+      uniquePatterns
+    )
+
+    // Collect every question ID the benchmark exposes, one page at a time.
+    const knownIds = new Set<string>()
+    let page = 0
+    let lastPage: number
+    do {
+      page += 1
+      const { questions, pagination } = await getBenchmarkQuestions(benchmark, {
+        page,
+        limit: 100,
+      })
+      for (const question of questions) {
+        knownIds.add(question.questionId)
+      }
+      lastPage = pagination.totalPages
+    } while (page < lastPage)
+
+    // Partition the expanded IDs, preserving the order they were returned in.
+    const valid = expandedIds.filter((id) => knownIds.has(id))
+    const missing = expandedIds.filter((id) => !knownIds.has(id))
+
+    // A pattern with no entry (or an empty entry) in patternResults matched nothing.
+    const unmatchedPatterns = uniquePatterns.filter((pattern) => {
+      const hits = patternResults[pattern]
+      return !hits || hits.length === 0
+    })
+
+    // Missing IDs come first, then the patterns that produced no matches.
+    return {
+      valid,
+      invalid: [...missing, ...unmatchedPatterns],
+      total: uniquePatterns.length,
+      expanded: expandedIds,
+      patternResults,
+    }
+  }
+
   function generateRunId() {
     const timestamp = new Date().toISOString().slice(0, 10).replace(/-/g, "")
     const random = Math.random().toString(36).slice(2, 6)
@@ -252,6 +327,7 @@ export default function NewRunPage() {
         : form.answeringModel
 
     let sampling: SamplingConfig | undefined
+    let questionIds: string[] | undefined
     if (activeTab === "new") {
       console.log("Form state:", {
         selectionMode: form.selectionMode,
@@ -272,6 +348,20 @@ export default function NewRunPage() {
           mode: "limit",
           limit: parseInt(form.limit),
         }
+      } else if (form.selectionMode === "questionIds") {
+        if (!form.questionIds.trim()) {
+          setError("Please enter at least one pattern or question ID")
+          return
+        }
+
+        // Require validation before submission (MANDATORY)
+        if (!questionIdValidation || questionIdValidation.invalid.length > 0) {
+          setError("Please validate patterns before starting the run")
+          return
+        }
+
+        // Use the expanded question IDs from validation
+        questionIds = questionIdValidation.expanded
       }
     }
     console.log("Submitting with sampling config:", sampling)
@@ -307,6 +397,7 @@ export default function NewRunPage() {
         judgeModel,
         answeringModel,
         sampling,
+        questionIds,
         concurrency,
         force: activeTab === "new",
         fromPhase,
@@ -871,14 +962,22 @@ export default function NewRunPage() {
                 Question Selection
               </label>
               <div className="flex gap-0 mb-4">
-                {(["full", "sample", "limit"] as SelectionMode[]).map((mode) => {
+                {(["full", "sample", "limit", "questionIds"] as SelectionMode[]).map((mode) => {
                   const isSelected = form.selectionMode === mode
-                  const labels = { full: "Full", sample: "Sample", limit: "Limit" }
+                  const labels = {
+                    full: "Full",
+                    sample: "Sample",
+                    limit: "Limit",
+                    questionIds: "IDs",
+                  }
                   return (
                     <button
                       key={mode}
                       type="button"
-                      onClick={() => setForm({ ...form, selectionMode: mode })}
+                      onClick={() => {
+                        setForm({ ...form, selectionMode: mode })
+                        setQuestionIdValidation(null)
+                      }}
                       className="px-3 py-1.5 text-sm font-medium transition-colors border-t border-b border-r first:border-l first:rounded-l last:rounded-r"
                       style={{
                         fontFamily: "'Space Grotesk', sans-serif",
@@ -941,6 +1040,104 @@ export default function NewRunPage() {
                   />
                 </div>
               )}
+
+              {form.selectionMode === "questionIds" && (
+                <div className="space-y-3">
+                  <div>
+                    <label className="block text-sm text-text-secondary mb-2">
+                      Question IDs (comma-separated)
+                    </label>
+                    <textarea
+                      className="w-full px-3 py-2 text-sm bg-[#222222] border border-[#444444] rounded text-text-primary placeholder-text-muted focus:outline-none focus:border-accent font-mono"
+                      rows={4}
+                      value={form.questionIds}
+                      onChange={(e) => {
+                        setForm({ ...form, questionIds: e.target.value })
+                        setQuestionIdValidation(null)
+                      }}
+                      placeholder="e.g., conv-30, conv-30-q0, conv-30-session_1"
+                    />
+                    <p className="text-xs text-text-muted mt-1">
+                      Enter question IDs, conversation IDs (e.g., conv-26), or session IDs (e.g.,
+                      conv-26-session_1), separated by commas
+                    </p>
+                  </div>
+
+                  {/* Validation Button */}
+                  <button
+                    type="button"
+                    onClick={async () => {
+                      if (!form.questionIds.trim()) {
+                        setError("Please enter at least one question ID")
+                        return
+                      }
+                      if (!form.benchmark) {
+                        setError("Please select a benchmark first")
+                        return
+                      }
+
+                      setValidatingQuestionIds(true)
+                      setError(null)
+                      try {
+                        const validation = await validateQuestionIds(
+                          form.benchmark,
+                          form.questionIds
+                        )
+                        setQuestionIdValidation(validation)
+
+                        if (validation.invalid.length > 0) {
+                          setError(`Invalid question IDs: ${validation.invalid.join(", ")}`)
+                        }
+                      } catch (e) {
+                        setError(e instanceof Error ? e.message : "Failed to validate question IDs")
+                      } finally {
+                        setValidatingQuestionIds(false)
+                      }
+                    }}
+                    disabled={validatingQuestionIds || !form.benchmark || !form.questionIds.trim()}
+                    className="px-3 py-1.5 text-sm bg-[#222222] border border-[#444444] rounded text-text-primary hover:border-accent disabled:opacity-50 disabled:cursor-not-allowed transition-colors"
+                  >
+                    {validatingQuestionIds ? (
+                      <>
+                        <div className="inline-block w-3 h-3 border-2 border-accent border-t-transparent rounded-full animate-spin mr-2" />
+                        Validating...
+                      </>
+                    ) : (
+                      "Validate Question IDs"
+                    )}
+                  </button>
+
+                  {/* Validation Result */}
+                  {questionIdValidation && (
+                    <div
+                      className={`p-3 rounded text-sm border ${
+                        questionIdValidation.invalid.length === 0
+                          ? "bg-green-500/10 border-green-500/20 text-green-400"
+                          : "bg-yellow-500/10 border-yellow-500/20 text-yellow-400"
+                      }`}
+                    >
+                      <div className="font-medium mb-1">
+                        {questionIdValidation.invalid.length === 0
+                          ? `✓ Valid: ${questionIdValidation.total} patterns expanded to ${questionIdValidation.expanded.length} questions`
+                          : `⚠ ${questionIdValidation.valid.length} valid, ${questionIdValidation.invalid.length} invalid patterns`}
+                      </div>
+                      {questionIdValidation.invalid.length > 0 && (
+                        <div className="text-xs mt-1">
+                          Invalid: {questionIdValidation.invalid.join(", ")}
+                        </div>
+                      )}
+                      {questionIdValidation.expanded.length > 0 && (
+                        <div className="text-xs mt-2 opacity-80">
+                          Sample expanded IDs:{" "}
+                          {questionIdValidation.expanded.slice(0, 5).join(", ")}
+                          {questionIdValidation.expanded.length > 5 &&
+                            ` ...and ${questionIdValidation.expanded.length - 5} more`}
+                        </div>
+                      )}
+                    </div>
+                  )}
+                </div>
+              )}
             </div>
 
             <div>
diff --git a/ui/lib/api.ts b/ui/lib/api.ts
index 8a22190..8576e90 100644
--- a/ui/lib/api.ts
+++ b/ui/lib/api.ts
@@ -149,7 +149,7 @@ export const PHASE_ORDER: PhaseId[] = [
   "report",
 ]
 
-export type SelectionMode = "full" | "sample" | "limit"
+export type SelectionMode = "full" | "sample" | "limit" | "questionIds"
 export type SampleType = "consecutive" | "random"
 
 export interface SamplingConfig {
@@ -176,6 +176,7 @@ export async function startRun(params: {
   answeringModel?: string
   limit?: number
   sampling?: SamplingConfig
+  questionIds?: string[]
   concurrency?: ConcurrencyConfig
   force?: boolean
   fromPhase?: PhaseId
@@ -221,6 +222,16 @@ export async function getBenchmarkQuestions(
   return fetchApi(`/api/benchmarks/${benchmark}/questions${query ? `?${query}` : ""}`)
 }
 
+/** POSTs `patterns` to the benchmark's expand-ids endpoint via fetchApi and returns the result. */
+export async function expandQuestionIdPatterns(
+  benchmark: string,
+  patterns: string[]
+): Promise<{ expandedIds: string[]; patternResults: Record<string, string[]> }> {
+  const endpoint = `/api/benchmarks/${benchmark}/expand-ids`
+  const payload = JSON.stringify({ patterns })
+  return fetchApi(endpoint, { method: "POST", body: payload })
+}
+
 export async function getModels(): Promise<{
   models: { openai: any[]; anthropic: any[]; google: any[] }
 }> {
@@ -445,6 +456,7 @@ export async function startCompare(params: {
   judgeModel: string
   answeringModel?: string
   sampling?: SamplingConfig
+  questionIds?: string[]
 }): Promise<{ message: string; compareId: string }> {
   return fetchApi("/api/compare/start", {
     method: "POST",