AutomateThePlanet
diff --git a/src/Spectra.CLI/Agent/Copilot/GenerationAgent.cs b/src/Spectra.CLI/Agent/Copilot/GenerationAgent.cs
Lines changed: 2 additions & 2 deletions
diff --git a/src/Spectra.CLI/Commands/Generate/GenerateHandler.cs b/src/Spectra.CLI/Commands/Generate/GenerateHandler.cs
Lines changed: 33 additions & 10 deletions
diff --git a/src/Spectra.CLI/Progress/ProgressManager.cs b/src/Spectra.CLI/Progress/ProgressManager.cs
Lines changed: 14 additions & 3 deletions
diff --git a/src/Spectra.CLI/Progress/ProgressPageWriter.cs b/src/Spectra.CLI/Progress/ProgressPageWriter.cs
Lines changed: 17 additions & 24 deletions
diff --git a/src/Spectra.CLI/Skills/Content/Agents/spectra-execution.agent.md b/src/Spectra.CLI/Skills/Content/Agents/spectra-execution.agent.md
Lines changed: 17 additions & 14 deletions
diff --git a/src/Spectra.CLI/Skills/Content/Agents/spectra-generation.agent.md b/src/Spectra.CLI/Skills/Content/Agents/spectra-generation.agent.md
Lines changed: 22 additions & 20 deletions
diff --git a/src/Spectra.CLI/Skills/Content/Skills/spectra-coverage.md b/src/Spectra.CLI/Skills/Content/Skills/spectra-coverage.md
Lines changed: 2 additions & 2 deletions
diff --git a/src/Spectra.CLI/Skills/Content/Skills/spectra-criteria.md b/src/Spectra.CLI/Skills/Content/Skills/spectra-criteria.md
Lines changed: 2 additions & 2 deletions
diff --git a/src/Spectra.CLI/Skills/Content/Skills/spectra-dashboard.md b/src/Spectra.CLI/Skills/Content/Skills/spectra-dashboard.md
Lines changed: 2 additions & 2 deletions
@@ -305,13 +305,13 @@ Do NOT include any explanatory text before or after the JSON. Output ONLY the JS
 
             {userPrompt}
 
-            {(string.IsNullOrEmpty(criteriaContext) ? "" : $"\n## ACCEPTANCE CRITERIA\n\n{criteriaContext}\n")}
+            {(string.IsNullOrEmpty(criteriaContext) ? "" : $"\n## ACCEPTANCE CRITERIA — MANDATORY\n\nYou MUST map each test case to matching acceptance criteria below. Every test MUST have at least one criterion ID in its \"criteria\" array. If a test doesn't match any criterion, use the closest related one.\n\n{criteriaContext}\n")}
             IMPORTANT:
             1. Use the tools to read documentation and check for duplicates first
             2. Only generate tests that are grounded in the documentation
             3. Ensure unique test IDs using GetNextTestIds
             4. Your FINAL response must be ONLY the JSON array — no other text
-            5. If acceptance criteria are provided, include matching criterion IDs in the "criteria" array field
+            5. MANDATORY: For each test, populate the "criteria" array with IDs of acceptance criteria it verifies (e.g. ["AC-REPORTING-001", "AC-REPORTING-003"]). Never leave criteria empty when acceptance criteria are provided above.
             """;
     }
 
 
@@ -1445,6 +1445,7 @@ private async Task<int> ExecuteFromDescriptionAsync(
             Steps = test.Steps,
             ExpectedResult = test.ExpectedResult,
             TestData = test.TestData,
+            Criteria = test.Criteria,
             FilePath = Path.GetRelativePath(testsPath, filePath),
             Grounding = test.Grounding
         };
@@ -1729,6 +1730,7 @@ internal static TestCase CreateTestWithGrounding(
                 Steps = test.Steps,
                 ExpectedResult = test.ExpectedResult,
                 TestData = test.TestData,
+                Criteria = test.Criteria,
                 FilePath = Path.GetRelativePath(testsPath, filePath),
                 Grounding = test.Grounding
             };
@@ -1758,6 +1760,7 @@ internal static TestCase CreateTestWithGrounding(
             Steps = test.Steps,
             ExpectedResult = test.ExpectedResult,
             TestData = test.TestData,
+            Criteria = test.Criteria,
             FilePath = Path.GetRelativePath(testsPath, filePath),
             Grounding = grounding
         };
@@ -1961,20 +1964,40 @@ private void ShowCountMismatchReason(
         if (allCriteria.Count == 0)
             return null;
 
-        // Filter: criteria from documents matching suite name, or criteria with matching component
+        // Filter: criteria matching suite name (exact or partial match on component, or partial match on source doc file name)
         var relevant = allCriteria.Where(c =>
-            // Match by source document name (e.g., suite "checkout" matches "checkout.criteria.yaml")
-            (c.SourceDoc != null && Path.GetFileNameWithoutExtension(c.SourceDoc)
-                .Equals(suiteName, StringComparison.OrdinalIgnoreCase)) ||
-            // Match by component field
+            // Exact match by component
             (c.Component != null && c.Component.Equals(suiteName, StringComparison.OrdinalIgnoreCase)) ||
-            // Match by criteria file name (e.g., "checkout.criteria.yaml" for suite "checkout")
-            criteriaFiles.Any(f => Path.GetFileName(f)
-                .StartsWith(suiteName + ".", StringComparison.OrdinalIgnoreCase) &&
-                allCriteria.IndexOf(c) >= 0)
+            // Component contains suite name (e.g., suite "reporting" matches component "reporting-analytics")
+            (c.Component != null && c.Component.Contains(suiteName, StringComparison.OrdinalIgnoreCase)) ||
+            // Suite contains component (e.g., suite "reporting-analytics" matches component "reporting")
+            (c.Component != null && suiteName.Contains(c.Component, StringComparison.OrdinalIgnoreCase)) ||
+            // Source doc file name contains suite name
+            (c.SourceDoc != null && Path.GetFileNameWithoutExtension(c.SourceDoc)
+                .Contains(suiteName, StringComparison.OrdinalIgnoreCase))
         ).ToList();
 
-        // If no suite-specific criteria found, use all criteria (better than none)
+        // Fallback when nothing matched above: load criteria from files whose name contains the suite name
+        if (relevant.Count == 0)
+        {
+            var matchingFiles = criteriaFiles.Where(f =>
+                Path.GetFileNameWithoutExtension(f).Replace(".criteria", "")
+                    .Contains(suiteName, StringComparison.OrdinalIgnoreCase)).ToList();
+
+            if (matchingFiles.Count > 0)
+            {
+                var matchingFileSet = new HashSet<string>(matchingFiles, StringComparer.OrdinalIgnoreCase);
+                // Reload only from matching files
+                relevant = new List<AcceptanceCriterion>();
+                foreach (var file in matchingFiles)
+                {
+                    var fileCriteria = await reader.ReadAsync(file, ct);
+                    relevant.AddRange(fileCriteria);
+                }
+            }
+        }
+
+        // Last resort: use all criteria (better than none, but may be noisy)
         if (relevant.Count == 0)
             relevant = allCriteria;
 
 
@@ -46,15 +46,26 @@ internal ProgressManager(string command, string[] phases, string resultPath, str
     public string ResultPath => _resultPath;
     public string ProgressPath => _progressPath;
 
-    /// <summary>Delete stale files from previous runs.</summary>
+    /// <summary>
+    /// Reset stale files from previous runs.
+    /// Writes a "starting" placeholder HTML so the browser shows a loading state
+    /// (with auto-refresh enabled) instead of the previous run's completed state.
+    /// </summary>
     public void Reset()
     {
         try
         {
             if (File.Exists(_resultPath))
                 File.Delete(_resultPath);
-            if (File.Exists(_progressPath))
-                File.Delete(_progressPath);
+
+            var placeholder = new CommandResult
+            {
+                Command = _command,
+                Status = "starting",
+                Message = "Initializing..."
+            };
+            var json = JsonSerializer.Serialize(placeholder, ResultFileOptions);
+            ProgressPageWriter.WriteProgressPage(_progressPath, json, isTerminal: false, _title);
         }
         catch
         {
 
@@ -471,15 +471,15 @@ .breakdown h3 {
                     {{BuildBody(jsonData, isTerminal, workspaceRoot)}}
                 </div>
                 <script>
-                    // Auto-refresh: reload page every 1.5s while status is not terminal.
-                    // Uses JavaScript instead of <meta refresh> for reliable file:// support.
+                    // Auto-refresh: always reload with cache-busting query parameter.
+                    // Runs even on terminal pages so that when a new run starts and
+                    // overwrites the file, a stale "Completed" page picks up the change.
+                    // Uses cache-busting query param because Chromium caches file:// URLs.
                     (function() {
-                        var isTerminal = {{(isTerminal ? "true" : "false")}};
-                        if (!isTerminal) {
-                            setInterval(function() {
-                                window.location.reload();
-                            }, 1500);
-                        }
+                        setInterval(function() {
+                            var base = window.location.pathname;
+                            window.location.replace(base + '?_=' + Date.now());
+                        }, 1500);
                     })();
 
                     // File links: open vscode:// URIs via JavaScript click handler
@@ -647,22 +647,15 @@ private static string BuildBody(string jsonData, bool isTerminal, string workspa
                 sb.Append(BuildFilesSection(files, workspaceRoot));
             }
 
-            // Footer
-            if (!isTerminal)
-            {
-                sb.Append("""
-                    <div class="footer">
-                        <span class="refresh-indicator">
-                            <span class="refresh-dot"></span>
-                            Auto-refreshing every 1.5 seconds
-                        </span>
-                    </div>
-                    """);
-            }
-            else
-            {
-                sb.Append("""<div class="footer">Generated by SPECTRA</div>""");
-            }
+            // Footer — always show refresh indicator since auto-refresh is always on
+            sb.Append("""
+                <div class="footer">
+                    <span class="refresh-indicator">
+                        <span class="refresh-dot"></span>
+                        Auto-refreshing every 1.5 seconds
+                    </span>
+                </div>
+                """);
 
             return sb.ToString();
         }
 
@@ -20,11 +20,10 @@ You are a QA Test Execution Assistant. You execute manual test suites interactiv
 
 ## IMPORTANT RULES
 
+- **HELP**: If user asks "help", "what can I do", or "what commands": follow the **`spectra-help`** SKILL (NOT `spectra-execution`). Read `spectra-help` and reply with its content.
 - **NEVER use `askQuestion`, `askForConfirmation`, or ANY dialog/popup tool.** Always use plain text responses so users can paste screenshots.
 - **NEVER fabricate failure notes.** Ask the user and wait for their exact words.
-- For non-execution tasks, follow the corresponding `spectra-*` SKILL (see delegation table at end). Do NOT use MCP tools or createFile for those.
-
-## If user asks for help: Follow the `spectra-help` SKILL.
+- For non-execution CLI tasks, see the **CLI Tasks** delegation table at end. Read the named SKILL, follow its steps exactly. Do NOT invent CLI commands.
 
 ## Execution Workflow
 
@@ -107,14 +106,18 @@ When user doesn't specify a suite:
 
 ## CLI Tasks (delegation)
 
-For these tasks, follow the named SKILL via `runInTerminal`. Do NOT use MCP tools.
-
-| Task | SKILL to follow |
-|------|----------------|
-| Dashboard | `spectra-dashboard` |
-| Coverage analysis | `spectra-coverage` |
-| Acceptance criteria | `spectra-criteria` |
-| Validate tests | `spectra-validate` |
-| List / show tests | `spectra-list` |
-| Docs index | `spectra-docs` |
-| Test generation | `spectra-generate` (or switch to Generation agent) |
+For these tasks, read the named SKILL first, then follow its steps exactly via `runInTerminal`. Do NOT use MCP tools. Do NOT invent CLI commands — the commands below are the ONLY valid forms.
+
+| Task | SKILL | CLI command |
+|------|-------|-------------|
+| Coverage analysis | `spectra-coverage` | `spectra ai analyze --coverage --auto-link --no-interaction --output-format json --verbosity quiet` |
+| Dashboard | `spectra-dashboard` | `spectra ai analyze --coverage --auto-link --no-interaction --output-format json --verbosity quiet && spectra dashboard --output ./site --no-interaction --output-format json --verbosity quiet` |
+| Extract criteria | `spectra-criteria` | `spectra ai analyze --extract-criteria --no-interaction --output-format json --verbosity quiet` |
+| Validate tests | `spectra-validate` | `spectra validate --no-interaction --output-format json --verbosity quiet` |
+| List suites | `spectra-list` | `spectra list --no-interaction --output-format json --verbosity quiet` |
+| Show test | `spectra-list` | `spectra show {test-id} --no-interaction --output-format json --verbosity quiet` |
+| Docs index | `spectra-docs` | `spectra docs index --no-interaction --output-format json --verbosity quiet` |
+| Docs reindex | `spectra-docs` | `spectra docs index --force --no-interaction --output-format json --verbosity quiet` |
+| Test generation | `spectra-generate` | (switch to Generation agent or follow SKILL steps) |
+
+**Workflow for CLI tasks**: open `.spectra-progress.html?nocache=1` → runInTerminal → awaitTerminal (do NOTHING while waiting) → readFile `.spectra-result.json` → present results. Never re-run a command that completed successfully. **Dashboard**: after results, also `show preview site/index.html` to open the dashboard.
@@ -10,43 +10,43 @@ disable-model-invocation: true
 
 You help users manage test cases using the SPECTRA CLI. Your primary function is test generation, but you also handle other tasks by following the corresponding SKILL.
 
-**CRITICAL: First show preview .spectra-progress.html, then runInTerminal. Between runInTerminal and awaitTerminal, do NOTHING.**
+**CRITICAL: First open `.spectra-progress.html?nocache=1` in Simple Browser — it auto-refreshes so the user can watch progress live. Then runInTerminal. Between runInTerminal and awaitTerminal, do NOTHING — no readFile, no listDirectory, no checking terminal output, no status messages. The progress page already shows live status. You ONLY read `.spectra-result.json` AFTER awaitTerminal returns.**
 
 **ALWAYS follow the full analyze → approve → generate flow. Never skip analysis.**
 
-## If user asks for help: Follow the `spectra-help` SKILL.
+**HELP**: If user asks "help", "what can I do", or "what commands": follow the **`spectra-help`** SKILL (NOT this agent's own file). Read `spectra-help` and reply with its content.
 
 ## Generate test cases
 
 | Flag | Description |
 |------|-------------|
 | `--suite {name}` | Target suite (REQUIRED) |
 | `--count {n}` | Number of tests (default: 5) |
-| `--focus {text}` | Focus: "negative", "edge cases", "high priority security" |
+| `--focus {text}` | Focus: "negative", "edge cases", "acceptance criteria", "happy path acceptance criteria" |
 | `--skip-critic` | Skip grounding verification |
 | `--analyze-only` | Only analyze, don't generate |
 
-**No `--priority`/`--type`/`--category` flag.** Use `--focus` for all filtering.
+**No `--priority`/`--type`/`--category` flag.** Use `--focus` for all filtering. Capture the user's FULL intent — don't split or drop parts. E.g. "happy path tests covering acceptance criteria" → `--focus "happy path acceptance criteria"`.
 
 ### Analyze (ALWAYS first)
 
-**Step 1**: show preview .spectra-progress.html
-**Step 2** — runInTerminal:
+**Step 1**: show preview .spectra-progress.html?nocache=1
+**Step 2** — runInTerminal (include `--focus` if user specified any filtering):
 ```
-spectra ai generate --suite {suite} --analyze-only --no-interaction --output-format json
+spectra ai generate --suite {suite} --analyze-only [--focus "{focus}"] --no-interaction --output-format json
 ```
-**Step 3** — awaitTerminal. Do NOTHING until complete.
+**Step 3** — awaitTerminal. The progress page auto-refreshes. Do NOTHING until complete — no readFile, no status messages.
 **Step 4** — readFile `.spectra-result.json`:
 - `"failed"` → show error
 - `"analyzed"` → show: "{already_covered} tests exist. Recommend {recommended} new tests:" with breakdown. STOP. Wait for user.
 
 ### Generate (after approval)
 
-**Step 5** — runInTerminal (add `--focus` if user specified type/priority):
+**Step 5** — runInTerminal (keep the SAME `--focus` from analysis):
 ```
 spectra ai generate --suite {suite} --count {count} [--focus "{focus}"] --no-interaction --output-format json
 ```
-**Step 6** — awaitTerminal. Do NOTHING until complete.
+**Step 6** — awaitTerminal. The progress page auto-refreshes. Do NOTHING until complete — no readFile, no status messages.
 **Step 7** — readFile `.spectra-result.json`:
 - `"failed"` → show error
 - `"completed"` → "Generated {tests_written} test cases." List files. If < requested, say "Run again for more."
@@ -55,7 +55,7 @@ spectra ai generate --suite {suite} --count {count} [--focus "{focus}"] --no-int
 
 ## Update tests
 
-**Step 1** — show preview `.spectra-progress.html`
+**Step 1** — show preview `.spectra-progress.html?nocache=1`
 **Step 2** — runInTerminal:
 ```
 spectra ai update --suite {suite} --no-interaction --output-format json --verbosity quiet
@@ -69,13 +69,15 @@ Show UP_TO_DATE, OUTDATED, ORPHANED counts from classification field.
 
 ## Other tasks (delegation)
 
-Follow the named SKILL exactly:
+Read the named SKILL first, then follow its steps exactly. Do NOT invent CLI commands — the commands below are the ONLY valid forms.
+
+| Task | SKILL | CLI command |
+|------|-------|-------------|
+| Coverage analysis | `spectra-coverage` | `spectra ai analyze --coverage --auto-link --no-interaction --output-format json --verbosity quiet` |
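+| Dashboard | `spectra-dashboard` | `spectra ai analyze --coverage --auto-link --no-interaction --output-format json --verbosity quiet && spectra dashboard --output ./site --no-interaction --output-format json --verbosity quiet` |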
+| Extract criteria | `spectra-criteria` | `spectra ai analyze --extract-criteria --no-interaction --output-format json --verbosity quiet` |
+| Validate tests | `spectra-validate` | `spectra validate --no-interaction --output-format json --verbosity quiet` |
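+| List suites | `spectra-list` | `spectra list --no-interaction --output-format json --verbosity quiet` |
+| Show test | `spectra-list` | `spectra show {test-id} --no-interaction --output-format json --verbosity quiet` |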
+| Docs index | `spectra-docs` | `spectra docs index [--force] --no-interaction --output-format json --verbosity quiet` |
 
-| Task | SKILL |
-|------|-------|
-| Coverage analysis | `spectra-coverage` |
-| Acceptance criteria | `spectra-criteria` |
-| Dashboard | `spectra-dashboard` |
-| Validate tests | `spectra-validate` |
-| List / show tests | `spectra-list` |
-| Docs index | `spectra-docs` |
+**Never re-run a command that completed successfully.** If the result shows "completed", present the results and stop. **Dashboard**: after results, also `show preview site/index.html` to open the dashboard.
@@ -14,15 +14,15 @@ You analyze test coverage by running a CLI command via runInTerminal.
 
 **Step 1** — Open the live progress page:
 ```
-show preview .spectra-progress.html
+show preview .spectra-progress.html?nocache=1
 ```
 
 **Step 2** — runInTerminal:
 ```
 spectra ai analyze --coverage --auto-link --no-interaction --output-format json --verbosity quiet
 ```
 
-**Step 3** — awaitTerminal. Wait for the command to finish. Between runInTerminal and awaitTerminal, do NOTHING. No readFile, no listDirectory, no extra tool calls.
+**Step 3** — awaitTerminal. The progress page auto-refreshes — the user can watch live. Between runInTerminal and awaitTerminal, do NOTHING. No readFile, no listDirectory, no checking terminal output, no status messages.
 
 **Step 4** — readFile `.spectra-result.json`
 
 
@@ -14,7 +14,7 @@ You help users manage acceptance criteria in SPECTRA. Run CLI commands via runIn
 
 **Step 1** — Open the live progress page:
 ```
-show preview .spectra-progress.html
+show preview .spectra-progress.html?nocache=1
 ```
 
 **Step 2** — runInTerminal:
@@ -23,7 +23,7 @@ spectra ai analyze --extract-criteria --no-interaction --output-format json --ve
 ```
 For full re-extraction (ignore cache), add `--force`.
 
-**Step 3** — awaitTerminal. Wait for the command to finish. This takes 1-5 minutes for large doc sets. Do NOT type anything into the terminal.
+**Step 3** — awaitTerminal. The progress page auto-refreshes — the user can watch live. Between runInTerminal and awaitTerminal, do NOTHING. No readFile, no listDirectory, no checking terminal output, no status messages.
 
 **Step 4** — readFile `.spectra-result.json`
 
 
@@ -14,15 +14,15 @@ You manage the dashboard by running CLI commands via runInTerminal. **NEVER use
 
 **Step 1** — Open the live progress page:
 ```
-show preview .spectra-progress.html
+show preview .spectra-progress.html?nocache=1
 ```
 
 **Step 2** — runInTerminal:
 ```
 spectra ai analyze --coverage --auto-link --no-interaction --output-format json --verbosity quiet && spectra dashboard --output ./site --no-interaction --output-format json --verbosity quiet
 ```
 
-**Step 3** — awaitTerminal. Wait for the command to finish. Between runInTerminal and awaitTerminal, do NOTHING. No readFile, no listDirectory, no extra tool calls.
+**Step 3** — awaitTerminal. The progress page auto-refreshes — the user can watch live. Between runInTerminal and awaitTerminal, do NOTHING. No readFile, no listDirectory, no checking terminal output, no status messages.
 
 **Step 4** — readFile `.spectra-result.json`