From 36edd705bfa36f1443ac03149063a2729d02090d Mon Sep 17 00:00:00 2001
From: Vladyslav <v.mykytenko@studytube.nl>
Date: Thu, 2 Apr 2026 14:13:00 +0300
Subject: [PATCH 1/2] Fix nullish error for OpenAI models, update config
 generator, add Makefile

---
 Makefile             |  6 +++++
 bin/explorbot-cli.ts | 63 +++++++++++++++++++++++++++++++++-----------
 bun.lock             |  6 ++++-
 src/ai/pilot.ts      | 24 ++++++++++++-----
 src/ai/planner.ts    | 16 ++++++++---
 5 files changed, 89 insertions(+), 26 deletions(-)
 create mode 100644 Makefile
diff --git a/Makefile b/Makefile
new file mode 100644
index 0000000..aeb7bbc
--- /dev/null
+++ b/Makefile
@@ -0,0 +1,6 @@
+start:
+	./bin/explorbot-cli.ts start
+
+init:
+	./bin/explorbot-cli.ts init
+	
\ No newline at end of file
diff --git a/bin/explorbot-cli.ts b/bin/explorbot-cli.ts
index 8dc75fa..f5c575e 100755
--- a/bin/explorbot-cli.ts
+++ b/bin/explorbot-cli.ts
@@ -144,7 +144,10 @@ addCommonOptions(program.command('plan <path> [feature]').description('Generate
         }
       }
 
-      await explorBot.plan(feature || undefined, { fresh: !options.append, style: options.style });
+      await explorBot.plan(feature || undefined, {
+        fresh: !options.append,
+        style: options.style,
+      });
 
       const plan = explorBot.getCurrentPlan();
       if (!plan?.tests.length) {
@@ -320,7 +323,13 @@ program
       log(`Working in directory: ${resolvedPath}`);
     }
 
-    const defaultConfig = `import { <your provider here> } from 'ai';
+    const defaultConfig = `import { createOpenRouter } from '@openrouter/ai-sdk-provider';
+
+// This example uses OpenRouter (one API key, many providers). Any Vercel AI SDK provider works; see
+// https://github.com/testomatio/explorbot/blob/main/docs/providers.md
+const openrouter = createOpenRouter({
+  apiKey: process.env.OPENROUTER_API_KEY,
+});
 
 const config = {
   playwright: {
@@ -330,9 +339,9 @@ const config = {
   },
 
   ai: {
-    provider: <your provider here>,
     model: '<your model here>',
-    apiKey: '<your api key here>',
+    visionModel: '<your vision model here>',
+    agenticModel: '<your agentic model here>',
   },
 
   reporter: {
@@ -470,7 +479,9 @@ program
   .option('-p, --path <path>', 'Working directory path')
   .action(async (url, description, options) => {
     try {
-      await ConfigParser.getInstance().loadConfig({ path: options.path || process.cwd() });
+      await ConfigParser.getInstance().loadConfig({
+        path: options.path || process.cwd(),
+      });
 
       if (url && description) {
         const { KnowledgeTracker } = await import('../src/knowledge-tracker.js');
@@ -498,7 +509,9 @@ program
   .option('-p, --path <path>', 'Working directory path')
   .action(async (url, options) => {
     try {
-      await ConfigParser.getInstance().loadConfig({ path: options.path || process.cwd() });
+      await ConfigParser.getInstance().loadConfig({
+        path: options.path || process.cwd(),
+      });
       const { KnowsCommand } = await import('../src/commands/knows-command.js');
       const explorBot = new ExplorBot({ path: options.path });
       const command = new KnowsCommand(explorBot);
@@ -648,14 +661,20 @@ browserCmd
   .option('-p, --path <path>', 'Working directory path')
   .action(async (options) => {
     const { launchServer, removeEndpointFile } = await import('../src/browser-server.js');
-    await ConfigParser.getInstance().loadConfig({ config: options.config, path: options.path });
+    await ConfigParser.getInstance().loadConfig({
+      config: options.config,
+      path: options.path,
+    });
     const config = ConfigParser.getInstance().getConfig();
 
     let show = config.playwright.show || false;
     if (options.show !== undefined) show = true;
     if (options.headless !== undefined) show = false;
 
-    const server = await launchServer({ browser: config.playwright.browser, show });
+    const server = await launchServer({
+      browser: config.playwright.browser,
+      show,
+    });
 
     console.log('Browser server is running. Press Ctrl+C to stop.');
 
@@ -677,7 +696,10 @@ browserCmd
   .option('-p, --path <path>', 'Working directory path')
   .action(async (options) => {
     const { getAliveEndpoint, removeEndpointFile } = await import('../src/browser-server.js');
-    await ConfigParser.getInstance().loadConfig({ config: options.config, path: options.path });
+    await ConfigParser.getInstance().loadConfig({
+      config: options.config,
+      path: options.path,
+    });
 
     const endpoint = await getAliveEndpoint();
     if (!endpoint) {
@@ -702,7 +724,10 @@ browserCmd
   .option('-p, --path <path>', 'Working directory path')
   .action(async (options) => {
     const { getAliveEndpoint } = await import('../src/browser-server.js');
-    await ConfigParser.getInstance().loadConfig({ config: options.config, path: options.path });
+    await ConfigParser.getInstance().loadConfig({
+      config: options.config,
+      path: options.path,
+    });
 
     const endpoint = await getAliveEndpoint();
     if (endpoint) {
@@ -743,15 +768,23 @@ program
 
     if (agent && name) {
       const { AddRuleCommand } = await import('../src/commands/add-rule-command.js');
-      const result = AddRuleCommand.createRuleFile(agent, name, { urlPattern: options.url });
+      const result = AddRuleCommand.createRuleFile(agent, name, {
+        urlPattern: options.url,
+      });
       process.exit(result ? 0 : 1);
     }
 
     const AddRule = (await import('../src/components/AddRule.js')).default;
-    render(React.createElement(AddRule, { initialAgent: agent || '', initialName: name || '' }), {
-      exitOnCtrlC: false,
-      patchConsole: false,
-    });
+    render(
+      React.createElement(AddRule, {
+        initialAgent: agent || '',
+        initialName: name || '',
+      }),
+      {
+        exitOnCtrlC: false,
+        patchConsole: false,
+      }
+    );
   });
 
 import { createApiCommands } from '../boat/api-tester/src/cli.ts';
diff --git a/bun.lock b/bun.lock
index 7c83b2a..fc675d5 100644
--- a/bun.lock
+++ b/bun.lock
@@ -83,7 +83,7 @@
 
     "@ai-sdk/groq": ["@ai-sdk/groq@3.0.2", "", { "dependencies": { "@ai-sdk/provider": "3.0.1", "@ai-sdk/provider-utils": "4.0.2" }, "peerDependencies": { "zod": "^3.25.76 || ^4.1.8" } }, "sha512-Gs7Ir9cUSYlbDIArNMt3+0Ql+OrEKELQhYfji5CCxQ8MdcJGbhbyPf9AQralu9PMxq/QEy2JSOgYW5zOnHDd2g=="],
 
-    "@ai-sdk/openai": ["@ai-sdk/openai@3.0.2", "", { "dependencies": { "@ai-sdk/provider": "3.0.1", "@ai-sdk/provider-utils": "4.0.2" }, "peerDependencies": { "zod": "^3.25.76 || ^4.1.8" } }, "sha512-GONwavgSWtcWO+t9+GpGK8l7nIYh+zNtCL/NYDSeHxHiw6ksQS9XMRWrZyE5NpJ0EXNxSAWCHIDmb1WvTqhq9Q=="],
+    "@ai-sdk/openai": ["@ai-sdk/openai@3.0.49", "", { "dependencies": { "@ai-sdk/provider": "3.0.8", "@ai-sdk/provider-utils": "4.0.21" }, "peerDependencies": { "zod": "^3.25.76 || ^4.1.8" } }, "sha512-U2f0pCyNn/jQH3wjgxr8o9VvCkuDFTtXbIhbFFtgXqCzMbed6rBnvzQcAMEK0/Pa44byL9zfcvCOFOflvkRA8w=="],
 
     "@ai-sdk/provider": ["@ai-sdk/provider@3.0.1", "", { "dependencies": { "json-schema": "^0.4.0" } }, "sha512-2lR4w7mr9XrydzxBSjir4N6YMGdXD+Np1Sh0RXABh7tWdNFFwIeRI1Q+SaYZMbfL8Pg8RRLcrxQm51yxTLhokg=="],
 
@@ -2653,6 +2653,10 @@
 
     "zone.js": ["zone.js@0.15.1", "", {}, "sha512-XE96n56IQpJM7NAoXswY3XRLcWFW83xe0BiAOeMD7K5k5xecOeul3Qcpx6GqEeeHNkW5DWL5zOyTbEfB4eti8w=="],
 
+    "@ai-sdk/openai/@ai-sdk/provider": ["@ai-sdk/provider@3.0.8", "", { "dependencies": { "json-schema": "^0.4.0" } }, "sha512-oGMAgGoQdBXbZqNG0Ze56CHjDZ1IDYOwGYxYjO5KLSlz5HiNQ9udIXsPZ61VWaHGZ5XW/jyjmr6t2xz2jGVwbQ=="],
+
+    "@ai-sdk/openai/@ai-sdk/provider-utils": ["@ai-sdk/provider-utils@4.0.21", "", { "dependencies": { "@ai-sdk/provider": "3.0.8", "@standard-schema/spec": "^1.1.0", "eventsource-parser": "^3.0.6" }, "peerDependencies": { "zod": "^3.25.76 || ^4.1.8" } }, "sha512-MtFUYI1/8mgDvRmaBDjbLJPFFrMG777AvSgyIFQtZHIMzm88R/12vYBBpnk7pfiWLFE1DSZzY4WDYzGbKAcmiw=="],
+
     "@aws-crypto/sha1-browser/@smithy/util-utf8": ["@smithy/util-utf8@2.3.0", "", { "dependencies": { "@smithy/util-buffer-from": "^2.2.0", "tslib": "^2.6.2" } }, "sha512-R8Rdn8Hy72KKcebgLiv8jQcQkXoLMOGGv5uI1/k0l+snqkOzQ1R0ChUBCxWMlBsFMekWjq0wRudIweFs7sKT5A=="],
 
     "@aws-crypto/sha256-browser/@smithy/util-utf8": ["@smithy/util-utf8@2.3.0", "", { "dependencies": { "@smithy/util-buffer-from": "^2.2.0", "tslib": "^2.6.2" } }, "sha512-R8Rdn8Hy72KKcebgLiv8jQcQkXoLMOGGv5uI1/k0l+snqkOzQ1R0ChUBCxWMlBsFMekWjq0wRudIweFs7sKT5A=="],
diff --git a/src/ai/pilot.ts b/src/ai/pilot.ts
index 8f815a2..c223767 100644
--- a/src/ai/pilot.ts
+++ b/src/ai/pilot.ts
@@ -85,7 +85,7 @@ export class Pilot implements Agent {
     const schema = z.object({
       decision: z.enum(['pass', 'fail', 'continue', 'skipped']).describe('pass = test succeeded, fail = test failed, continue = tester should keep going, skipped = scenario is irrelevant OR systematic execution failures prevented testing'),
       reason: z.string().describe('What happened and why (1-2 sentences). Do NOT repeat the decision status (e.g. "scenario goal achieved/not achieved") — just explain the evidence. For continue: explain why rejected and suggest alternatives.'),
-      guidance: z.string().nullish().describe('Required for "continue": specific actionable instruction for the tester — what exactly to verify, retry differently, or complete next. Be concrete.'),
+      guidance: z.string().nullable().describe('Required for "continue": specific actionable instruction for the tester — what exactly to verify, retry differently, or complete next. Be concrete.'),
     });
 
     const userContent = dedent`
@@ -117,12 +117,18 @@ export class Pilot implements Agent {
     `;
 
     const messages = [
-      { role: 'system' as const, content: this.buildVerdictSystemPrompt(type, task) },
+      {
+        role: 'system' as const,
+        content: this.buildVerdictSystemPrompt(type, task),
+      },
       { role: 'user' as const, content: userContent },
     ];
 
     try {
-      const response = await this.provider.generateObject(messages, schema, this.provider.getAgenticModel('pilot'), { agentName: 'pilot', experimental_telemetry: { functionId: 'pilot.reviewVerdict' } });
+      const response = await this.provider.generateObject(messages, schema, this.provider.getAgenticModel('pilot'), {
+        agentName: 'pilot',
+        experimental_telemetry: { functionId: 'pilot.reviewVerdict' },
+      });
 
       const result = response?.object;
       if (!result) {
@@ -222,7 +228,9 @@ export class Pilot implements Agent {
   async planTest(task: Test, currentState: ActionResult): Promise<string> {
     tag('substep').log('Pilot planning test...');
 
-    const pageSummary = await this.researcher.summary(currentState, { allowNewResearch: false });
+    const pageSummary = await this.researcher.summary(currentState, {
+      allowNewResearch: false,
+    });
     const agenticModel = this.provider.getAgenticModel('pilot');
     this.conversation = this.provider.startConversation(this.getSystemPrompt(task, currentState, pageSummary), 'pilot', agenticModel);
 
@@ -257,7 +265,9 @@ export class Pilot implements Agent {
 
     tag('substep').log('Pilot reviewing new page...');
 
-    const pageSummary = await this.researcher.summary(currentState, { allowNewResearch: false });
+    const pageSummary = await this.researcher.summary(currentState, {
+      allowNewResearch: false,
+    });
     if (!pageSummary) return '';
 
     const stateContext = this.buildStateContext(currentState);
@@ -289,7 +299,9 @@ export class Pilot implements Agent {
     tag('substep').log('Pilot analyzing progress...');
 
     if (!this.conversation) {
-      const pageSummary = await this.researcher.summary(currentState, { allowNewResearch: false });
+      const pageSummary = await this.researcher.summary(currentState, {
+        allowNewResearch: false,
+      });
       const agenticModel = this.provider.getAgenticModel('pilot');
       this.conversation = this.provider.startConversation(this.getSystemPrompt(task, currentState, pageSummary), 'pilot', agenticModel);
     }
diff --git a/src/ai/planner.ts b/src/ai/planner.ts
index 78f92e4..db912fd 100644
--- a/src/ai/planner.ts
+++ b/src/ai/planner.ts
@@ -32,7 +32,7 @@ const TasksSchema = z.object({
       z.object({
         scenario: z.string().describe('A single sentence describing what to test'),
         priority: z.enum(['critical', 'important', 'high', 'normal', 'low']).describe('Priority of the task based on business importance'),
-        startUrl: z.string().optional().describe('Start URL for the test if different from plan URL (only for tests on visited subpages)'),
+        startUrl: z.string().nullable().describe('Start URL for the test if different from plan URL (only for tests on visited subpages)'),
         steps: z.array(z.string()).describe('List of steps to perform for this scenario. Each step should be a specific action (e.g., "Click on Login button", "Enter username in email field", "Submit the form"). Keep steps atomic and actionable.'),
         expectedOutcomes: z
           .array(z.string())
@@ -325,13 +325,18 @@ export class Planner extends PlannerBase implements Agent {
 
     conversation.addUserText(planningPrompt);
     const currentState = this.stateManager.getCurrentState();
-    const research = await this.researcher.research(currentState || state, { deep: true });
+    const research = await this.researcher.research(currentState || state, {
+      deep: true,
+    });
     let plannerResearch = mdq(research).query('code').replace('');
     for (const table of mdq(plannerResearch).query('table').each()) {
       const rawTable = table.text();
       const rows = table.toJson();
       if (rows.length === 0 || !rows[0].Element) continue;
-      const elementWithType = rows.map((r) => ({ Element: r.Element, Type: r.Type || '' }));
+      const elementWithType = rows.map((r) => ({
+        Element: r.Element,
+        Type: r.Type || '',
+      }));
       plannerResearch = plannerResearch.replace(rawTable, jsonToTable(elementWithType, ['Element', 'Type']));
     }
 
@@ -349,7 +354,10 @@ export class Planner extends PlannerBase implements Agent {
       </page_research>
     `);
 
-    const rawFlows = this.experienceTracker.getSuccessfulExperience(state, { includeDescendants: true, stripCode: true });
+    const rawFlows = this.experienceTracker.getSuccessfulExperience(state, {
+      includeDescendants: true,
+      stripCode: true,
+    });
     const flows = rawFlows.map((f) => this.cleanExperienceFlows(f)).filter(Boolean) as string[];
     if (flows.length > 0) {
       conversation.addUserText(dedent`

From a218ec5576179ddded350fc7db028c2e926972b6 Mon Sep 17 00:00:00 2001
From: Vladyslav <v.mykytenko@studytube.nl>
Date: Sun, 5 Apr 2026 15:00:15 +0300
Subject: [PATCH 2/2] Update docs according to CHANGELOG.md

---
 bun.lock              |   6 +-
 docs/agents.md        |  25 ++++-
 docs/commands.md      | 239 ++++++++++++++++++++++++++++++++++++------
 docs/configuration.md | 220 ++++++++++++++++++++++++++------------
 docs/planner.md       |  64 ++++++-----
 docs/researcher.md    |  95 ++++++++++-------
 package.json          |  12 ++-
 7 files changed, 487 insertions(+), 174 deletions(-)

diff --git a/bun.lock b/bun.lock
index fc675d5..e9b4567 100644
--- a/bun.lock
+++ b/bun.lock
@@ -7,7 +7,7 @@
       "dependencies": {
         "@ai-sdk/anthropic": "^3.0",
         "@ai-sdk/groq": "^3.0",
-        "@ai-sdk/openai": "^3.0",
+        "@ai-sdk/openai": "^3.0.49",
         "@axe-core/playwright": "^4.11.0",
         "@inkjs/ui": "^2.0.0",
         "@langfuse/otel": "^4.5.1",
@@ -20,7 +20,7 @@
         "@opentelemetry/sdk-trace-base": "^2.2.0",
         "@opentelemetry/semantic-conventions": "^1.38.0",
         "@scalar/openapi-parser": "^0.25.6",
-        "@testomatio/reporter": "2.7.3",
+        "@testomatio/reporter": "2.7.6",
         "ai": "^6.0.6",
         "axe-core": "^4.11.1",
         "bash-tool": "^1.3.15",
@@ -919,7 +919,7 @@
 
     "@testing-library/react": ["@testing-library/react@16.3.0", "", { "dependencies": { "@babel/runtime": "^7.12.5" }, "peerDependencies": { "@testing-library/dom": "^10.0.0", "@types/react": "^18.0.0 || ^19.0.0", "@types/react-dom": "^18.0.0 || ^19.0.0", "react": "^18.0.0 || ^19.0.0", "react-dom": "^18.0.0 || ^19.0.0" }, "optionalPeers": ["@types/react", "@types/react-dom"] }, "sha512-kFSyxiEDwv1WLl2fgsq6pPBbw5aWKrsY2/noi1Id0TK0UParSF62oFQFGHXIyaG4pp2tEub/Zlel+fjjZILDsw=="],
 
-    "@testomatio/reporter": ["@testomatio/reporter@2.7.3", "", { "dependencies": { "@aws-sdk/client-s3": "^3.279.0", "@aws-sdk/lib-storage": "^3.279.0", "@cucumber/cucumber": "^10.9.0", "@octokit/rest": "^21.1.1", "aws-sdk": "^2.1072.0", "callsite-record": "^4.1.4", "commander": "^12", "cross-spawn": "^7.0.3", "csv-writer": "^1.6.0", "debug": "4.3.4", "dotenv": "^16.0.1", "fast-xml-parser": "^5.3.4", "file-url": "3.0.0", "filesize": "^10.1.6", "gaxios": ">=6.0 || >=7.0.0-rc.4 || <8", "glob": "^10.3", "handlebars": "^4.7.8", "has-flag": "^5.0.1", "humanize-duration": "^3.27.3", "is-valid-path": "^0.1.1", "js-yaml": "^4.1.1", "json-cycle": "^1.3.0", "lodash.memoize": "^4.1.2", "lodash.merge": "^4.6.2", "minimatch": "^10.2.4", "picocolors": "^1.0.1", "pretty-ms": "^7.0.1", "promise-retry": "^2.0.1", "strip-ansi": "7.1.0", "uuid": "^9.0.0" }, "bin": { "report-xml": "src/bin/reportXml.js", "start-test-run": "src/bin/startTest.js", "upload-artifacts": "src/bin/uploadArtifacts.js", "reporter": "src/bin/cli.js" } }, "sha512-ytrKPVPeQ7PkA/BfTkkkNMs4QlUQ/ZwFZhSsrxIN8SAph6M9GG1gjjUuft7hrwAgN2aWZkDyp8CL0eYe6czHYg=="],
+    "@testomatio/reporter": ["@testomatio/reporter@2.7.6", "", { "dependencies": { "@aws-sdk/client-s3": "^3.279.0", "@aws-sdk/lib-storage": "^3.279.0", "@cucumber/cucumber": "^10.9.0", "@octokit/rest": "^21.1.1", "aws-sdk": "^2.1072.0", "callsite-record": "^4.1.4", "commander": "^12", "cross-spawn": "^7.0.3", "csv-writer": "^1.6.0", "debug": "4.3.4", "dotenv": "^16.0.1", "fast-xml-parser": "^5.3.4", "file-url": "3.0.0", "filesize": "^10.1.6", "gaxios": ">=6.0 || >=7.0.0-rc.4 || <8", "glob": "^10.3", "handlebars": "^4.7.8", "has-flag": "^5.0.1", "humanize-duration": "^3.27.3", "is-valid-path": "^0.1.1", "js-yaml": "^4.1.1", "json-cycle": "^1.3.0", "lodash.memoize": "^4.1.2", "lodash.merge": "^4.6.2", "minimatch": "^10.2.4", "picocolors": "^1.0.1", "pretty-ms": "^7.0.1", "promise-retry": "^2.0.1", "strip-ansi": "7.1.0", "uuid": "^9.0.0" }, "bin": { "report-xml": "src/bin/reportXml.js", "start-test-run": "src/bin/startTest.js", "upload-artifacts": "src/bin/uploadArtifacts.js", "reporter": "src/bin/cli.js" } }, "sha512-Q7onX+TBqXGfeANSRTEfPUl/T4l7kJTjSfOWBKEJvD4aVRAaCH1L+psnsHkQr8i9IzGtHowoGJlBeCzGNfiMCg=="],
 
     "@tokenizer/inflate": ["@tokenizer/inflate@0.4.1", "", { "dependencies": { "debug": "^4.4.3", "token-types": "^6.1.1" } }, "sha512-2mAv+8pkG6GIZiF1kNg1jAjh27IDxEPKwdGul3snfztFerfPGI1LjDezZp3i7BElXompqEtPmoPx6c2wgtWsOA=="],
 
diff --git a/docs/agents.md b/docs/agents.md
index b2aa7ed..ae18af8 100644
--- a/docs/agents.md
+++ b/docs/agents.md
@@ -19,17 +19,20 @@ flowchart LR
 **Purpose:** Handles all browser interactions — clicks, form fills, navigation.
 
 **What it does:**
+
 - Executes CodeceptJS commands in the browser
 - Tries multiple locator strategies when selectors fail
 - Automatically resolves failed interactions without stopping
 - Remembers what worked (and what didn't) for next time
 
 **Why you'll love it:**
+
 - No more `ElementNotFound` exceptions killing your test runs
 - Self-healing when your UI changes
 - Learns optimal selectors for your specific app
 
 **Commands that use Navigator:**
+
 - `/navigate <target>`
 - `I.click()`, `I.fillField()`, `I.amOnPage()`, etc.
 
@@ -38,6 +41,7 @@ flowchart LR
 **Purpose:** Analyzes pages to understand what's actually there.
 
 **What it does:**
+
 - Discovers all interactive UI elements
 - Expands hidden content (accordions, dropdowns, modals)
 - Maps navigation paths and form structures
@@ -45,12 +49,14 @@ flowchart LR
 - Filters out irrelevant elements (cookie banners, ads)
 
 **Why you'll love it:**
+
 - Discovers UI elements you forgot existed
 - Gives you a complete picture of what's testable
 - Documents forms with all their validation rules
 - Configurable filtering to focus on what matters
 
 **Commands that use Researcher:**
+
 - `explorbot research /path` (CLI)
 - `/research [path]` (TUI)
 - `/research --deep` — expand hidden elements
@@ -63,6 +69,7 @@ See [Researcher Agent](./researcher.md) for detailed configuration and usage.
 **Purpose:** Generates test scenarios from research findings.
 
 **What it does:**
+
 - Creates business-focused test scenarios
 - Assigns priority levels (critical/important/high/normal/low)
 - Generates expected outcomes for verification
@@ -71,12 +78,14 @@ See [Researcher Agent](./researcher.md) for detailed configuration and usage.
 - Cycles through planning styles (normal, psycho, curious) for comprehensive coverage
 
 **Why you'll love it:**
+
 - Creates tests that matter, not just "click stuff"
 - Prioritizes by risk (critical flows first)
 - Different styles ensure broad coverage over multiple iterations
 - Fully customizable — add your own styles and page-specific rules
 
 **Commands that use Planner:**
+
 - `/plan [feature]`
 - `/explore`
 
@@ -87,6 +96,7 @@ See [Planner Agent](./planner.md) for detailed documentation on planning styles,
 **Purpose:** Executes the planned scenarios.
 
 **What it does:**
+
 - Runs test scenarios step by step
 - Adapts when things don't go as expected
 - Tracks state changes during execution
@@ -94,11 +104,13 @@ See [Planner Agent](./planner.md) for detailed documentation on planning styles,
 - Uses research context for smart decisions
 
 **Why you'll love it:**
+
 - Handles unexpected modals and popups
 - Recovers from minor failures automatically
 - Produces detailed execution logs
 
 **Commands that use Tester:**
+
 - `/test [scenario]`
 - `/explore`
 
@@ -107,31 +119,37 @@ See [Planner Agent](./planner.md) for detailed documentation on planning styles,
 **Purpose:** Supervises Tester and intervenes when tests get stuck.
 
 **What it does:**
+
 - Maintains separate conversation to track test progress over time
 - Detects stuck patterns (loops, repeated failures, no page changes)
 - Decides what context Tester needs (HTML, ARIA, UI map)
 - Asks user for help when automated recovery fails
 
 **Why you'll love it:**
+
 - Catches when Tester is spinning wheels on the same failure
 - Requests user input before giving up on a test
 - Can use smarter models without token cost explosion (only sees tool summaries, not raw HTML)
 
 **When Pilot intervenes:**
+
 - Actions succeed but page doesn't change (wrong element)
 - Same action repeated multiple times (loop)
 - Same locator keeps failing (need alternative approach)
 - Only research/context calls, no action tools (not progressing)
 
-## Captain Agent *(coming soon)*
+## Captain Agent
 
-**Purpose:** Orchestrates the whole testing session.
+**Purpose:** Orchestrates the whole testing session and handles user commands in the TUI.
 
 **What it does:**
-- Coordinates all agents intelligently
+
 - Responds to user commands in real-time
 - Adjusts strategy based on discoveries
 - Manages conversation context efficiently
+- Runs in idle mode with access to diagnostic tools
+- Inspects test sessions (logs, tool calls, ARIA states, pilot analysis)
+- Reads/writes files, evaluates browser JS, manages tabs
 
 ## Per-Agent Model Configuration
 
@@ -157,6 +175,7 @@ export default {
 ```
 
 **Typical optimization:**
+
 - Navigator needs fast responses for real-time interaction
 - Researcher benefits from vision capabilities
 - Planner can use a slightly larger model for better test design
diff --git a/docs/commands.md b/docs/commands.md
index d37b158..3ab04ee 100644
--- a/docs/commands.md
+++ b/docs/commands.md
@@ -9,13 +9,16 @@ Explorbot has two types of commands:
 
 Some commands work in both modes. Where a CLI equivalent exists, it is noted below.
 
-| TUI Command | CLI Equivalent |
-|-------------|---------------|
-| `/explore [url]` | `explorbot explore [path]` |
-| `/research [url]` | `explorbot research <url>` |
-| `/plan [feature]` | `explorbot plan <path> [feature]` |
-| `/drill` | `explorbot drill <url>` |
-| `/know [note]` | `explorbot knows:add [url] [description]` |
+| TUI Command        | CLI Equivalent                            |
+| ------------------ | ----------------------------------------- |
+| `/explore [url]`   | `explorbot explore [path]`                |
+| `/research [url]`  | `explorbot research <url>`                |
+| `/plan [feature]`  | `explorbot plan <path> [feature]`         |
+| `/drill`           | `explorbot drill <url>`                   |
+| `/know [note]`     | `explorbot knows:add [url] [description]` |
+| `/test [scenario]` | `explorbot test <planfile> [index]`       |
+| `/freesail`        | `explorbot freesail [startUrl]`           |
+| `/rules:add`       | `explorbot add-rule [agent] [name]`       |
 
 CLI commands run headless by default, execute the task, and exit. TUI commands run inside an interactive session where you can chain multiple actions.
 
@@ -23,16 +26,16 @@ CLI commands run headless by default, execute the task, and exit. TUI commands r
 
 These options are available on all CLI commands (`start`, `explore`, `plan`, `drill`, `research`, `context`):
 
-| Option | Description |
-|--------|-------------|
-| `-v, --verbose` | Enable verbose logging |
-| `--debug` | Enable debug logging (same as `--verbose`) |
-| `-c, --config <path>` | Path to configuration file |
-| `-p, --path <path>` | Working directory path |
-| `-s, --show` | Show browser window |
-| `--headless` | Run browser in headless mode |
-| `--incognito` | Run without recording experiences |
-| `--session [file]` | Save/restore browser session (cookies, localStorage) from file |
+| Option                | Description                                                    |
+| --------------------- | -------------------------------------------------------------- |
+| `-v, --verbose`       | Enable verbose logging                                         |
+| `--debug`             | Enable debug logging (same as `--verbose`)                     |
+| `-c, --config <path>` | Path to configuration file                                     |
+| `-p, --path <path>`   | Working directory path                                         |
+| `-s, --show`          | Show browser window                                            |
+| `--headless`          | Run browser in headless mode                                   |
+| `--incognito`         | Run without recording experiences                              |
+| `--session [file]`    | Save/restore browser session (cookies, localStorage) from file |
 
 ### `--session`
 
@@ -97,12 +100,87 @@ explorbot start /dashboard
 explorbot browser stop
 ```
 
-| Option | Description |
-|--------|-------------|
-| `-s, --show` | Launch browser in headed mode (visible window) |
-| `--headless` | Launch browser in headless mode |
-| `-c, --config <path>` | Path to configuration file |
-| `-p, --path <path>` | Working directory path |
+| Option                | Description                                    |
+| --------------------- | ---------------------------------------------- |
+| `-s, --show`          | Launch browser in headed mode (visible window) |
+| `--headless`          | Launch browser in headless mode                |
+| `-c, --config <path>` | Path to configuration file                     |
+| `-p, --path <path>`   | Working directory path                         |
+
+## Test Execution
+
+### `explorbot test <planfile> [index]`
+
+Run tests from a saved plan file without launching the TUI.
+
+```bash
+explorbot test plan.md 1           # run first test
+explorbot test plan.md 1-3         # run tests 1 to 3
+explorbot test plan.md 1,3,5       # run specific tests
+explorbot test plan.md '*'         # run all pending tests (quote * so the shell does not expand it)
+explorbot test plan.md all         # same as *
+```
+
+| Option             | Description                |
+| ------------------ | -------------------------- |
+| `--grep <pattern>` | Run tests matching pattern |
+
+### `explorbot shell <url> <command>`
+
+Navigate to a URL, execute a single CodeceptJS command, and exit. Useful for quick one-off browser interactions.
+
+```bash
+explorbot shell /login "I.see('Welcome')"
+explorbot shell /dashboard "I.click('Settings')"
+```
+
+## Autonomous Exploration
+
+### `explorbot freesail [startUrl]`
+
+Continuously explore and test pages autonomously. Explorbot navigates to new pages, researches them, runs tests, then moves on — indefinitely.
+
+```bash
+explorbot freesail /admin                   # start exploring from /admin
+explorbot freesail /dashboard --deep        # depth-first: explore nearby pages first
+explorbot freesail /app --shallow           # breadth-first: spread across many pages
+explorbot freesail /app --scope /admin      # only explore pages under /admin
+explorbot freesail /app --max-tests 20      # stop after 20 tests
+```
+
+| Option                | Description                                                             |
+| --------------------- | ----------------------------------------------------------------------- |
+| `--deep`              | Depth-first: prioritize newly discovered pages close to the current URL |
+| `--shallow`           | Breadth-first: pick the globally least-visited page next                |
+| `--scope <prefix>`    | Restrict to URLs starting with the given prefix                         |
+| `--max-tests <count>` | Stop after the specified number of tests                                |
+
+## API Testing
+
+### `explorbot api`
+
+AI-powered API testing. Generate and run test plans for API endpoints.
+
+```bash
+explorbot api init                          # initialize API testing project
+explorbot api plan /users                   # generate test plan for endpoint
+explorbot api plan /users --style curious   # use a specific planning style
+explorbot api test plan.md                  # run tests from plan
+explorbot api test plan.md 1-3              # run specific tests
+explorbot api know /users "CRUD endpoint"   # add API knowledge
+```
+
+## Rules Management
+
+### `explorbot add-rule [agent] [name]`
+
+Create a rule file for an agent. Opens an interactive TUI form when called without arguments.
+
+```bash
+explorbot add-rule researcher check-tooltips
+explorbot add-rule tester wait-for-toasts --url '/admin/*'
+explorbot add-rule                              # interactive mode
+```
 
 ## Exploration Commands
 
@@ -113,12 +191,17 @@ Start full exploration cycle: research → plan → test.
 ```
 /explore
 /explore /dashboard
+/explore --max-tests 5
 ```
 
 If a URL is provided, navigates there first. After completion, use `/navigate` or `/explore` again to continue.
 
 **CLI equivalent:** `explorbot explore [path]` — runs the full cycle and exits.
 
+| Option                | Description                              |
+| --------------------- | ---------------------------------------- |
+| `--max-tests <count>` | Stop after the specified number of tests |
+
 ### `/research [url] [--data]`
 
 Analyze the current page using the Researcher agent.
@@ -127,13 +210,20 @@ Analyze the current page using the Researcher agent.
 /research
 /research /settings
 /research --data
+/research --no-fix        # skip locator validation/fix cycle
 ```
 
 - If URL provided, navigates there first
 - `--data` flag extracts structured data from the page
+- `--no-fix` skips the locator validation and fix cycle
 
 **CLI equivalent:** `explorbot research <url>` — researches the page and exits.
 
+```bash
+explorbot research /dashboard --no-fix    # skip locator fix
+explorbot research /dashboard --incognito # without experience files
+```
+
 ### `/plan [feature]`
 
 Generate test scenarios for the current page using the Planner agent.
@@ -142,12 +232,38 @@ Generate test scenarios for the current page using the Planner agent.
 /plan
 /plan login
 /plan checkout flow
+/plan --style curious          # use a specific planning style
+/plan --clear                  # clear current plan and create new one
+/plan --fresh                  # re-plan from scratch, discarding existing plan
 ```
 
 Optional feature focus narrows the scope of generated tests.
 
 **CLI equivalent:** `explorbot plan <path> [feature]` — generates a plan and exits.
 
+Options:
+
+| Option            | Description                                                   |
+| ----------------- | ------------------------------------------------------------- |
+| `--style <style>` | Set planning style (`normal`, `curious`, `psycho`, or custom) |
+| `-a, --append`    | Add tests to existing plan instead of replacing it            |
+| `--clear`         | Clear the current plan and immediately create a new one       |
+| `--fresh`         | Re-plan from scratch, discarding the existing plan            |
+| `--max-tests <n>` | Limit the number of tests generated                           |
+
+### `/context [url]`
+
+Analyze the current page using the Context agent.
+
+```
+/context
+/context /settings
+/context --visual
+```
+
+- If URL provided, navigates there first
+- `--visual` flag extracts visual information from the page
+
 ### `/test [scenario|number|*]`
 
 Execute test scenarios using the Tester agent.
@@ -155,11 +271,32 @@ Execute test scenarios using the Tester agent.
 ```
 /test              # Run next pending test
 /test *            # Run all pending tests
-/test 2            # Run test #2 from plan
+/test 2            # Run test #2 from plan (visible/enabled tests)
 /test login        # Run tests matching "login"
 /test User can logout successfully   # Create and run ad-hoc test
 ```
 
+### `/freesail`
+
+Start autonomous exploration from the current page inside the TUI (alias: `/freeride`).
+
+```
+/freesail
+/freesail --deep
+/freesail --shallow
+/freesail --scope /admin
+/freesail --max-tests 10
+/freesail --deep --max-tests 20
+```
+
+### `/debug`
+
+Toggle debug output on/off during a session.
+
+```
+/debug
+```
+
 ### `/navigate <target>`
 
 Navigate to a URI or state using AI assistance.
@@ -193,6 +330,29 @@ Load a previously saved plan.
 /plan:load output/plans/checkout-plan.md
 ```
 
+**CLI equivalent:** `explorbot plan:load <planfile> [index]` — displays the plan as a table, or shows the details of a single test when an index is given.
+
+```bash
+explorbot plan:load plan.md            # show all tests in table
+explorbot plan:load plan.md 3          # show details for test #3
+```
+
+### `/plan-edit`
+
+Edit the test plan interactively in the TUI — enable or disable tests and reorder them.
+
+```
+/plan-edit
+```
+
+### Plan Editor
+
+When in the plan editor (opened via `/plan-edit` or `Ctrl+E`):
+
+| Key   | Action                                 |
+| ----- | -------------------------------------- |
+| `Del` | Remove the selected test from the plan |
+
 ## Page Inspection
 
 ### `/aria [--short]`
@@ -264,6 +424,16 @@ Exit the application gracefully.
 
 ## Rules & Styles
 
+### `/rules:add`
+
+Create a rule file for an agent interactively from the TUI (alias: `/add-rule`).
+
+```
+/add-rule researcher check-tooltips
+/rules:add tester slow-forms
+/rules:add                              # interactive mode
+```
+
 ### `explorbot extract-styles <agent>`
 
 Extract built-in planning styles to your `rules/` directory for customization.
@@ -278,7 +448,7 @@ After extraction, edit the markdown files to customize how the Planner or Chief
 
 ## Direct Browser Control
 
-In addition to slash commands, you can execute CodeceptJS commands directly:
+In addition to slash commands, you can execute CodeceptJS `I.*` commands or raw Playwright `page.*` commands directly:
 
 ```
 I.amOnPage('/login')
@@ -288,12 +458,19 @@ I.see('Welcome')
 I.waitForElement('.modal', 5)
 ```
 
-All [CodeceptJS Playwright helpers](https://codecept.io/helpers/Playwright/) are available.
+```
+page.click('.my-button')
+page.fill('#email', 'test@example.com')
+await page.locator('.item').count()
+```
+
+All [CodeceptJS Playwright helpers](https://codecept.io/helpers/Playwright/) are available, as well as the raw Playwright `page` object.
 
 ## Keyboard Shortcuts
 
-| Key | Action |
-|-----|--------|
-| `ESC` | Enable input / cancel current action |
-| `Ctrl+T` | Toggle session timer display |
-| `Ctrl+C` | Exit application |
+| Key      | Action                               |
+| -------- | ------------------------------------ |
+| `ESC`    | Enable input / cancel current action |
+| `Ctrl+T` | Toggle session timer display         |
+| `Ctrl+C` | Exit application                     |
+| `Ctrl+E` | Open plan editor                     |
diff --git a/docs/configuration.md b/docs/configuration.md
index 5970b97..1da6d62 100644
--- a/docs/configuration.md
+++ b/docs/configuration.md
@@ -101,11 +101,11 @@ ai: {
 
 ### Rules vs Knowledge vs systemPrompt
 
-| Mechanism | Purpose | URL-aware | File-based |
-|-----------|---------|-----------|------------|
-| **Rules** | Agent-specific instructions | Yes | Yes (`rules/<agent>/`) |
-| **Knowledge** | App domain info (credentials, data) | Yes | Yes (`knowledge/`) |
-| **systemPrompt** | Quick inline instructions | No | No (in config) |
+| Mechanism        | Purpose                             | URL-aware | File-based             |
+| ---------------- | ----------------------------------- | --------- | ---------------------- |
+| **Rules**        | Agent-specific instructions         | Yes       | Yes (`rules/<agent>/`) |
+| **Knowledge**    | App domain info (credentials, data) | Yes       | Yes (`knowledge/`)     |
+| **systemPrompt** | Quick inline instructions           | No        | No (in config)         |
 
 Rules and `systemPrompt` can be used together — rules from files load first, then `systemPrompt` is appended.
 
@@ -165,16 +165,16 @@ Each agent can be individually configured with its own model and custom system p
 
 ### Available Agents
 
-| Agent | Purpose |
-|-------|---------|
-| `tester` | Executes test scenarios |
-| `planner` | Generates test plans |
-| `researcher` | Analyzes page structure |
-| `navigator` | Handles browser navigation |
-| `captain` | Orchestrates user commands |
+| Agent                  | Purpose                    |
+| ---------------------- | -------------------------- |
+| `tester`               | Executes test scenarios    |
+| `planner`              | Generates test plans       |
+| `researcher`           | Analyzes page structure    |
+| `navigator`            | Handles browser navigation |
+| `captain`              | Orchestrates user commands |
 | `experience-compactor` | Compresses experience data |
-| `quartermaster` | Accessibility analysis |
-| `historian` | Session recording |
+| `quartermaster`        | Accessibility analysis     |
+| `historian`            | Session recording          |
 
 ### Agent Options
 
@@ -191,14 +191,15 @@ agents: {
 }
 ```
 
-| Option | Type | Description |
-|--------|------|-------------|
-| `model` | `LanguageModel` | Model instance for this agent (overrides default) |
-| `enabled` | `boolean` | Enable or disable the agent |
-| `rules` | `Array<string \| Record<string, string>>` | Rule files to load from `rules/<agent>/` (URL-aware). See [Rules](#rules) |
-| `systemPrompt` | `string` | Additional instructions appended to the agent's prompt (inline fallback) |
-| `beforeHook` | `Hook \| HookPatternMap` | Code to run before agent execution |
-| `afterHook` | `Hook \| HookPatternMap` | Code to run after agent execution |
+| Option            | Type                                      | Description                                                                            |
+| ----------------- | ----------------------------------------- | -------------------------------------------------------------------------------------- |
+| `model`           | `LanguageModel`                           | Model instance for this agent (overrides default)                                      |
+| `enabled`         | `boolean`                                 | Enable or disable the agent                                                            |
+| `rules`           | `Array<string \| Record<string, string>>` | Rule files to load from `rules/<agent>/` (URL-aware). See [Rules](#rules)              |
+| `systemPrompt`    | `string`                                  | Additional instructions appended to the agent's prompt (inline fallback)               |
+| `providerOptions` | `object`                                  | Provider-specific options passed through (e.g. `{ groq: { reasoningEffort: 'low' } }`) |
+| `beforeHook`      | `Hook \| HookPatternMap`                  | Code to run before agent execution                                                     |
+| `afterHook`       | `Hook \| HookPatternMap`                  | Code to run after agent execution                                                      |
 
 See [Agent Hooks](./hooks.md) for detailed hook configuration.
 
@@ -206,12 +207,13 @@ See [Agent Hooks](./hooks.md) for detailed hook configuration.
 
 The researcher agent supports all standard agent options plus additional options for controlling interactive exploration:
 
-| Option | Type | Description |
-|--------|------|-------------|
-| `excludeSelectors` | `string[]` | CSS selectors for containers to exclude |
-| `includeSelectors` | `string[]` | CSS selectors for containers to always explore |
-| `stopWords` | `string[]` | Words to filter out (replaces defaults if provided) |
-| `maxElementsToExplore` | `number` | Maximum elements to explore per page (default: 10) |
+| Option                 | Type       | Description                                                                                     |
+| ---------------------- | ---------- | ----------------------------------------------------------------------------------------------- |
+| `excludeSelectors`     | `string[]` | CSS selectors for containers to exclude                                                         |
+| `includeSelectors`     | `string[]` | CSS selectors for containers to always explore                                                  |
+| `stopWords`            | `string[]` | Words to filter out (replaces defaults if provided)                                             |
+| `maxElementsToExplore` | `number`   | Maximum elements to explore per page (default: 10)                                              |
+| `errorPageTimeout`     | `number`   | Seconds to wait for error page recovery before giving up. Default: `10`. Set to `0` to disable. |
 
 ```javascript
 ai: {
@@ -228,6 +230,48 @@ See [Researcher Agent](./researcher.md) for detailed documentation and examples.
 
 See [AI Providers](./providers.md) for recommended models and provider setup.
 
+## Reporter
+
+Explorbot can generate HTML test reports locally without requiring a Testomatio account.
+
+```javascript
+reporter: {
+  enabled: true,   // Generate HTML reports to output/reports/
+  html: false,     // Force HTML reports even when Testomatio is configured
+}
+```
+
+| Option    | Type      | Default | Description                                                                   |
+| --------- | --------- | ------- | ----------------------------------------------------------------------------- |
+| `enabled` | `boolean` | `false` | Enable HTML report generation (auto-enabled when `TESTOMATIO` env var is set) |
+| `html`    | `boolean` | `false` | Generate HTML reports in addition to Testomatio when both are configured      |
+
+## File Uploads
+
+Provide custom files for upload tests:
+
+```javascript
+files: {
+  'Profile photo': './fixtures/photo.png',
+  'Test document': './fixtures/document.pdf',
+  'Data export': './fixtures/data.xlsx',
+}
+```
+
+Explorbot includes built-in sample files (PNG, PDF, DOCX, XLSX, ZIP, MP4, MP3). Custom entries extend the built-in set.
+
+## Experience
+
+```javascript
+experience: {
+  maxReadLines: 100,  // Maximum lines to read from each experience entry
+}
+```
+
+| Option         | Type     | Default | Description                                          |
+| -------------- | -------- | ------- | ---------------------------------------------------- |
+| `maxReadLines` | `number` | `100`   | Truncates long experience entries to this many lines |
+
 ## Playwright Settings
 
 ### Browser Selection
@@ -240,6 +284,14 @@ playwright: {
 }
 ```
 
+### Action Delay
+
+```javascript
+playwright: {
+  waitForAction: 500,  // Delay in ms after each Playwright action (default: 500)
+}
+```
+
 ### Viewport and Window Size
 
 ```javascript
@@ -338,65 +390,81 @@ explorbot explore --config ./custom/path/config.js
 export default {
   // Browser automation settings
   playwright: {
-    browser: 'chromium',           // 'chromium' | 'firefox' | 'webkit'
-    url: 'http://localhost:3000',  // Starting URL (required)
-    show: false,                   // Show browser window
-    windowSize: '1280x720',        // Browser window size
-    slowMo: 0,                     // Slow down actions (ms)
-    timeout: 30000,                // Default timeout (ms)
-    waitForNavigation: 'load',     // 'load' | 'domcontentloaded' | 'networkidle'
-    waitForTimeout: 1000,          // Wait after navigation (ms)
-    ignoreHTTPSErrors: false,      // Ignore HTTPS certificate errors
-    userAgent: 'custom-agent',     // Custom user agent string
+    browser: 'chromium', // 'chromium' | 'firefox' | 'webkit'
+    url: 'http://localhost:3000', // Starting URL (required)
+    show: false, // Show browser window
+    windowSize: '1280x720', // Browser window size
+    slowMo: 0, // Slow down actions (ms)
+    timeout: 30000, // Default timeout (ms)
+    waitForNavigation: 'load', // 'load' | 'domcontentloaded' | 'networkidle'
+    waitForTimeout: 1000, // Wait after navigation (ms)
+    ignoreHTTPSErrors: false, // Ignore HTTPS certificate errors
+    userAgent: 'custom-agent', // Custom user agent string
     viewport: {
       width: 1280,
       height: 720,
     },
-    args: ['--disable-gpu'],       // Browser launch arguments
-    chromium: { args: [] },        // Chromium-specific args
-    firefox: { args: [] },         // Firefox-specific args
-    webkit: { args: [] },          // WebKit-specific args
+    args: ['--disable-gpu'], // Browser launch arguments
+    chromium: { args: [] }, // Chromium-specific args
+    firefox: { args: [] }, // Firefox-specific args
+    webkit: { args: [] }, // WebKit-specific args
   },
 
   // AI provider settings
   ai: {
-    model: groq('gpt-oss-20b'),          // Default model instance (required)
-    visionModel: groq('llama-scout-4'),  // Model for screenshot analysis
-    vision: true,                  // Enable vision features
-    maxAttempts: 3,                // Retry attempts for AI calls
-    retryDelay: 1000,              // Delay between retries (ms)
-    config: {},                    // Additional provider config
-    langfuse: {                    // Observability settings
+    model: groq('gpt-oss-20b'), // Default model instance (required)
+    visionModel: groq('llama-scout-4'), // Model for screenshot analysis
+    agenticModel: groq('gpt-oss-120b'), // Model for agentic tasks (Captain, Pilot verdict review)
+    vision: true, // Enable vision features
+    maxAttempts: 3, // Retry attempts for AI calls
+    retryDelay: 1000, // Delay between retries (ms)
+    config: {}, // Additional provider config
+    langfuse: {
+      // Observability settings
       enabled: true,
       publicKey: 'pk-...',
       secretKey: 'sk-...',
       baseUrl: 'https://cloud.langfuse.com',
     },
-    agents: {                      // Per-agent configuration
+    agents: {
+      // Per-agent configuration
       tester: {
         model: groq('gpt-oss-20b'),
         enabled: true,
         rules: ['wait-for-toasts', { '/admin/*': 'admin-creds' }],
-        systemPrompt: '...',       // Inline fallback
+        systemPrompt: '...', // Inline fallback
       },
       planner: {
         styles: ['normal', 'psycho', 'curious'],
         rules: [{ '/checkout/*': 'payment-rules' }],
       },
-      researcher: {                // Researcher-specific options
+      researcher: {
+        // Researcher-specific options
         model: groq('gpt-oss-20b'), // Override default model
-        enabled: true,             // Enable/disable agent
-        systemPrompt: '...',       // Additional instructions
-        excludeSelectors: [],      // CSS selectors to exclude
-        includeSelectors: [],      // CSS selectors to always explore
-        stopWords: [],             // Text patterns to skip (replaces defaults)
-        maxElementsToExplore: 10,  // Max elements per page
+        enabled: true, // Enable/disable agent
+        systemPrompt: '...', // Additional instructions
+        excludeSelectors: [], // CSS selectors to exclude
+        includeSelectors: [], // CSS selectors to always explore
+        stopWords: [], // Text patterns to skip (replaces defaults)
+        maxElementsToExplore: 10, // Max elements per page
+        errorPageTimeout: 10, // Seconds to wait for error page recovery (0 to disable)
+        providerOptions: {}, // Provider-specific options
+      },
+      navigator: {
+        /* ... */
+      },
+      captain: {
+        /* ... */
+      },
+      'experience-compactor': {
+        /* ... */
+      },
+      quartermaster: {
+        /* ... */
+      },
+      historian: {
+        /* ... */
       },
-      navigator: { /* ... */ },
-      captain: { /* ... */ },
-      'experience-compactor': { /* ... */ },
-      quartermaster: { /* ... */ },
-      historian: { /* ... */ },
     },
   },
 
@@ -416,17 +484,33 @@ export default {
     },
   },
 
+  // Reporter settings
+  reporter: {
+    enabled: false, // Generate HTML reports to output/reports/
+    html: false, // Force HTML reports even when Testomatio is configured
+  },
+
+  // Custom files for upload tests
+  files: {
+    // 'Profile photo': './fixtures/photo.png',
+  },
+
+  // Experience settings
+  experience: {
+    maxReadLines: 100, // Max lines to read from each experience entry
+  },
+
   // Action execution settings
   action: {
-    delay: 1000,                   // Delay between actions (ms)
-    retries: 3,                    // Retry failed actions
+    delay: 1000, // Delay between actions (ms)
+    retries: 3, // Retry failed actions
   },
 
   // Directory paths
   dirs: {
-    knowledge: 'knowledge',        // Domain knowledge files
-    experience: 'experience',      // Learned patterns
-    output: 'output',              // Test results and logs
+    knowledge: 'knowledge', // Domain knowledge files
+    experience: 'experience', // Learned patterns
+    output: 'output', // Test results and logs
   },
 };
 ```
diff --git a/docs/planner.md b/docs/planner.md
index 2f7b94a..6ef5deb 100644
--- a/docs/planner.md
+++ b/docs/planner.md
@@ -31,13 +31,13 @@ ai: {
 
 ### Options Reference
 
-| Option | Type | Default | Description |
-|--------|------|---------|-------------|
-| `model` | `LanguageModel` | default model | Override model for Planner |
-| `styles` | `string[]` | `['normal', 'psycho', 'curious']` | Style names and cycling order |
-| `stylesDir` | `string` | `rules/planner/styles/` | Custom directory for style files |
-| `rules` | `RuleEntry[]` | `[]` | URL-aware rule files from `rules/planner/` |
-| `systemPrompt` | `string` | - | Inline instructions appended to the prompt |
+| Option         | Type            | Default                           | Description                                |
+| -------------- | --------------- | --------------------------------- | ------------------------------------------ |
+| `model`        | `LanguageModel` | default model                     | Override model for Planner                 |
+| `styles`       | `string[]`      | `['normal', 'curious', 'psycho']` | Style names and cycling order              |
+| `stylesDir`    | `string`        | `rules/planner/styles/`           | Custom directory for style files           |
+| `rules`        | `RuleEntry[]`   | `[]`                              | URL-aware rule files from `rules/planner/` |
+| `systemPrompt` | `string`        | -                                 | Inline instructions appended to the prompt |
 
 ## Planning Styles
 
@@ -45,22 +45,22 @@ Each time the Planner generates scenarios, it applies a **style** — a testing
 
 ### Built-in Styles
 
-| Style | Focus | What it generates |
-|-------|-------|-------------------|
-| **normal** | Complete user workflows | CRUD operations, form submissions, filter+verify flows. Each test changes application state. Distributes tests across all feature areas. |
-| **psycho** | Invalid and extreme inputs | Empty submissions, 10000-character strings, special characters, SQL injection, wrong formats, boundary values, incompatible combinations. Finds what breaks. |
-| **curious** | Coverage gaps | Cross-references previous test results with page research to find untested controls. Exercises every select option, checkbox state, and skipped form field. Fills gaps, not repeats. |
+| Style       | Focus                      | What it generates                                                                                                                                                                    |
+| ----------- | -------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
+| **normal**  | Complete user workflows    | CRUD operations, form submissions, filter+verify flows. Each test changes application state. Distributes tests across all feature areas.                                             |
+| **psycho**  | Invalid and extreme inputs | Empty submissions, 10000-character strings, special characters, SQL injection, wrong formats, boundary values, incompatible combinations. Finds what breaks.                         |
+| **curious** | Coverage gaps              | Cross-references previous test results with page research to find untested controls. Exercises every select option, checkbox state, and skipped form field. Fills gaps, not repeats. |
 
 ### How Cycling Works
 
-The default cycle is: **normal** → **psycho** → **curious** → **normal** → ...
+The default cycle is: **normal** → **curious** → **psycho** → **normal** → ...
 
-| Iteration | Style | Purpose |
-|-----------|-------|---------|
-| 1st `/plan` | normal | Cover core workflows and CRUD operations |
-| 2nd `/plan` | psycho | Stress-test with invalid and extreme inputs |
-| 3rd `/plan` | curious | Fill coverage gaps from previous iterations |
-| 4th `/plan` | normal | Re-examine with fresh research |
+| Iteration   | Style   | Purpose                                     |
+| ----------- | ------- | ------------------------------------------- |
+| 1st `/plan` | normal  | Cover core workflows and CRUD operations    |
+| 2nd `/plan` | curious | Fill coverage gaps from previous iterations |
+| 3rd `/plan` | psycho  | Stress-test with invalid and extreme inputs |
+| 4th `/plan` | normal  | Re-examine with fresh research              |
 
 Each iteration only proposes scenarios that don't already exist in the plan. When all feature areas are covered, the Planner returns an empty list.
 
@@ -99,6 +99,7 @@ Create `rules/planner/styles/security.md`:
 
 ```markdown
 Focus on security-related scenarios:
+
 - Test all inputs for XSS by entering <script> tags
 - Check that sensitive data is masked in the UI
 - Verify that unauthorized actions show proper error messages
@@ -124,6 +125,14 @@ planner: {
 }
 ```
 
+Use the default order (normal → curious → psycho):
+
+```javascript
+planner: {
+  styles: ['normal', 'curious', 'psycho'],
+}
+```
+
 Alternate between normal and security:
 
 ```javascript
@@ -153,6 +162,7 @@ Write it as instructions to a senior QA engineer describing how to think about t
 Think like a real user of this product. What would they actually do on this page?
 
 Prefer maximal realistic happy paths:
+
 - Fill required AND optional fields
 - Set meaningful non-default choices
 - Continue the story after creation (open the item, adjust attributes, add a note)
@@ -185,13 +195,15 @@ Rules are additive — all matching rules are concatenated and appended to the P
 
 The Planner assigns priorities based on business importance:
 
-| Priority | Meaning | Examples |
-|----------|---------|---------|
-| **critical** | Core business functionality | Login, checkout, primary CRUD |
-| **important** | Key user flows | Profile edit, search, main filters |
-| **high** | Secondary features | Edge cases for critical flows |
-| **normal** | Supporting actions | Settings, configuration |
-| **low** | Minor interactions | Cosmetic checks, boundary tests |
+| Priority      | Meaning                     | Examples                           |
+| ------------- | --------------------------- | ---------------------------------- |
+| **critical**  | Core business functionality | Login, checkout, primary CRUD      |
+| **important** | Key user flows              | Profile edit, search, main filters |
+| **high**      | Secondary features          | Edge cases for critical flows      |
+| **normal**    | Supporting actions          | Settings, configuration            |
+| **low**       | Minor interactions          | Cosmetic checks, boundary tests    |
+
+Tests that create, update, or delete data are prioritized over UI-only interactions (view switching, filtering, pagination).
 
 ## See Also
 
diff --git a/docs/researcher.md b/docs/researcher.md
index c533e42..3d167b3 100644
--- a/docs/researcher.md
+++ b/docs/researcher.md
@@ -36,17 +36,18 @@ ai: {
 
 ### Options Reference
 
-| Option | Type | Default | Description |
-|--------|------|---------|-------------|
-| `model` | `string` | - | Override default model for Researcher |
-| `systemPrompt` | `string` | - | Additional instructions appended to the research prompt |
-| `sections` | `string[]` | all sections | Page sections to identify (order = priority) |
-| `excludeSelectors` | `string[]` | `[]` | CSS selectors to exclude from deep exploration |
-| `includeSelectors` | `string[]` | `[]` | CSS selectors to always explore (second pass) |
-| `stopWords` | `string[]` | defaults | Words to filter during deep exploration (replaces defaults) |
-| `maxElementsToExplore` | `number` | `10` | Max elements per deep exploration |
-| `retries` | `number` | `2` | Retries when most locators are broken in Stage 2 |
-| `providerOptions` | `object` | - | Provider-specific options (e.g. reasoning effort) |
+| Option                 | Type            | Default      | Description                                                                      |
+| ---------------------- | --------------- | ------------ | -------------------------------------------------------------------------------- |
+| `model`                | `LanguageModel` | -            | Override default model for Researcher                                            |
+| `systemPrompt`         | `string`        | -            | Additional instructions appended to the research prompt                          |
+| `sections`             | `string[]`      | all sections | Page sections to identify (order = priority)                                     |
+| `excludeSelectors`     | `string[]`      | `[]`         | CSS selectors to exclude from deep exploration                                   |
+| `includeSelectors`     | `string[]`      | `[]`         | CSS selectors to always explore (second pass)                                    |
+| `stopWords`            | `string[]`      | defaults     | Words to filter during deep exploration (replaces defaults)                      |
+| `maxElementsToExplore` | `number`        | `10`         | Max elements per deep exploration                                                |
+| `retries`              | `number`        | `2`          | Retries when most locators are broken in Stage 2                                 |
+| `errorPageTimeout`     | `number`        | `10`         | Seconds to wait for error page recovery before giving up. Set to `0` to disable. |
+| `providerOptions`      | `object`        | -            | Provider-specific options (e.g. reasoning effort)                                |
 
 See [Configuration Examples](#configuration-examples) at the end of this document for common setups.
 
@@ -110,13 +111,14 @@ Before research begins, Explorbot injects `data-explorbot-eidx` attributes into
 
 This eidx serves as a stable bridge between three different representations of the same element:
 
-| Representation | What it provides | Where eidx appears |
-|----------------|------------------|--------------------|
-| **HTML** | Structure, attributes, CSS selectors | `<button eidx="5">Save</button>` |
-| **ARIA tree** | Accessible roles, names | Mapped back via Playwright `getByRole` |
-| **Screenshot** | Visual position, color, icon | Colored label `5` drawn above the element |
+| Representation | What it provides                     | Where eidx appears                        |
+| -------------- | ------------------------------------ | ----------------------------------------- |
+| **HTML**       | Structure, attributes, CSS selectors | `<button eidx="5">Save</button>`          |
+| **ARIA tree**  | Accessible roles, names              | Mapped back via Playwright `getByRole`    |
+| **Screenshot** | Visual position, color, icon         | Colored label `5` drawn above the element |
 
 When AI produces a research table with `eidx=5`, that same index is used to:
+
 - Test the element's CSS locator against the live DOM
 - Look up its coordinates from the annotated screenshot
 - Generate a fallback XPath if CSS is broken
@@ -127,13 +129,13 @@ Without eidx, there would be no reliable way to correlate "the third button in t
 
 Research processes each page through 5 stages:
 
-| Stage | Name | What happens |
-|-------|------|--------------|
-| 1 | **Research** (AI) | AI analyzes HTML + ARIA, produces UI map with sections, containers, ARIA locators, CSS locators, eidx references |
-| 2 | **Test** | Test containers first, then element locators. Capture exact counts (`0 elements`, `3 elements`, `dynamic ID`). If all containers broken or >80% locators broken — retry Stage 1 |
-| 3 | **Fix** (AI, same conversation) | Continue Stage 1 conversation with Playwright test results. AI fixes broken locators with full page context |
-| 4 | **Visual** (optional) | Annotate screenshot with eidx labels. AI extracts coordinates, colors, icons. Merge into research by eidx |
-| 5 | **Backfill** | Re-test all locators. For still-broken elements: look up eidx in DOM, generate XPath from attributes. Nullify containers that are still broken |
+| Stage | Name                            | What happens                                                                                                                                                                    |
+| ----- | ------------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| 1     | **Research** (AI)               | AI analyzes HTML + ARIA, produces UI map with sections, containers, ARIA locators, CSS locators, eidx references                                                                |
+| 2     | **Test**                        | Test containers first, then element locators. Capture exact counts (`0 elements`, `3 elements`, `dynamic ID`). If all containers broken or >80% locators broken — retry Stage 1 |
+| 3     | **Fix** (AI, same conversation) | Continue Stage 1 conversation with Playwright test results. AI fixes broken locators with full page context                                                                     |
+| 4     | **Visual** (optional)           | Annotate screenshot with eidx labels. AI extracts coordinates, colors, icons. Merge into research by eidx                                                                       |
+| 5     | **Backfill**                    | Re-test all locators. For still-broken elements: look up eidx in DOM, generate XPath from attributes. Nullify containers that are still broken                                  |
 
 Stage 3 reuses the Stage 1 conversation — the AI already has full context about the page HTML, so it fixes locators more accurately without extra token cost.
 
@@ -167,22 +169,29 @@ Extracts domain-specific content (articles, products, users) as structured data.
 
 The Researcher breaks pages into sections based on their UI purpose. Sections are identified in priority order:
 
-| Section | Description |
-|---------|-------------|
-| `focus` | Focused overlay (modal, drawer, popup, active form) |
-| `list` | List area (items collection, table, cards, or list view) |
-| `detail` | Detail area (selected item preview or full details) |
-| `panes` | Screen is split into equal panes |
-| `content` | Main area of page |
-| `menu` | Page menu (toolbar, context actions, filters, dropdowns) |
-| `navigation` | Main navigation (top bar, sidebar, breadcrumbs) |
+| Section      | Description                                              |
+| ------------ | -------------------------------------------------------- |
+| `focus`      | Focused overlay (modal, drawer, popup, active form)      |
+| `list`       | List area (items collection, table, cards, or list view) |
+| `detail`     | Detail area (selected item preview or full details)      |
+| `panes`      | Screen is split into equal panes                         |
+| `content`    | Main area of page                                        |
+| `menu`       | Page menu (toolbar, context actions, filters, dropdowns) |
+| `navigation` | Main navigation (top bar, sidebar, breadcrumbs)          |
 
 Each section includes:
+
 - A **container CSS selector** scoping all elements within
 - A **UI map table** listing interactive elements with ARIA and CSS locators
 
 Override the default section list via `ai.agents.researcher.sections` — see [Configuration](#configuration).
 
+### Focused Section
+
+The Researcher automatically identifies the user's primary interaction area using AI declaration, ARIA analysis, and visual fallback. The focused section (e.g., an open dialog or the main content area) is marked in the research output. The Planner prioritizes tests for the focused section.
+
+> Section names cannot be "Focus" or "Focused" — they must describe their content (e.g., "Detail", "Modal", "Form").
+
 ## Vision Model Support
 
 ### Without Vision
@@ -217,6 +226,7 @@ Vision is particularly useful for pages with icon-only buttons, canvas-based UIs
 Deep exploration (`--deep` flag) discovers hidden UI by clicking through elements to find modals, dropdowns, tabs, and menus.
 
 For each element, the researcher:
+
 1. Captures state before click
 2. Clicks the element
 3. Detects what changed (navigation, modal, menu, UI change)
@@ -235,6 +245,7 @@ Only clickable roles are explored: `button`, `link`, `menuitem`, `tab`, `option`
 Elements matching these words are skipped (word-boundary matching):
 
 **Default stop words:**
+
 - `close`, `cancel`, `dismiss`, `exit`, `back`
 - `cookie`, `consent`, `gdpr`, `privacy`
 - `accept all`, `decline all`, `reject all`
@@ -275,11 +286,11 @@ Modal dialog for user login...
 
 > Container: '[role="dialog"]'
 
-| Element | ARIA | CSS |
-|---------|------|-----|
-| 'Email' | { role: 'textbox', text: 'Email' } | 'input#email' |
+| Element    | ARIA                                  | CSS                      |
+| ---------- | ------------------------------------- | ------------------------ |
+| 'Email'    | { role: 'textbox', text: 'Email' }    | 'input#email'            |
 | 'Password' | { role: 'textbox', text: 'Password' } | 'input[name="password"]' |
-| 'Sign In' | { role: 'button', text: 'Sign In' } | 'button[type="submit"]' |
+| 'Sign In'  | { role: 'button', text: 'Sign In' }   | 'button[type="submit"]'  |
 
 ## Content Section
 
@@ -287,13 +298,14 @@ Main content area...
 
 > Container: '.main-content'
 
-| Element | ARIA | CSS | XPath | Coordinates |
-|---------|------|-----|-------|-------------|
-| 'Save' | { role: 'button', text: 'Save' } | 'button.save' | - | (400, 300) |
-| 'Delete' | { role: 'button', text: 'Delete' } | - | '//button[@class="del"]' | (500, 300) |
+| Element  | ARIA                               | CSS           | XPath                    | Coordinates |
+| -------- | ---------------------------------- | ------------- | ------------------------ | ----------- |
+| 'Save'   | { role: 'button', text: 'Save' }   | 'button.save' | -                        | (400, 300)  |
+| 'Delete' | { role: 'button', text: 'Delete' } | -             | '//button[@class="del"]' | (500, 300)  |
 ```
 
 Notes:
+
 - XPath column only appears when CSS is broken and XPath was backfilled from the DOM
 - Coordinates column only appears when vision model analyzed the screenshot
 - Container is shown as a blockquote `> Container: '...'` before the table
@@ -301,9 +313,12 @@ Notes:
 ## Caching
 
 Research results are cached for 1 hour:
+
 - In memory during session
 - On disk in `output/research/`
 
+Similar pages reuse cached research via HTML fingerprint matching — if the page structure hasn't changed, re-analysis is skipped automatically.
+
 Use `--force` to bypass cache:
 
 ```bash
diff --git a/package.json b/package.json
index fb5254a..f9df5a5 100644
--- a/package.json
+++ b/package.json
@@ -31,12 +31,18 @@
     "check:fix": "biome check --write .",
     "langfuse:export": "bun run .claude/skills/explorbot-debug/langfuse-export.ts"
   },
-  "keywords": ["cli", "react", "ink", "codeceptjs", "playwright"],
+  "keywords": [
+    "cli",
+    "react",
+    "ink",
+    "codeceptjs",
+    "playwright"
+  ],
   "author": "",
   "dependencies": {
     "@ai-sdk/anthropic": "^3.0",
     "@ai-sdk/groq": "^3.0",
-    "@ai-sdk/openai": "^3.0",
+    "@ai-sdk/openai": "^3.0.49",
     "@axe-core/playwright": "^4.11.0",
     "@inkjs/ui": "^2.0.0",
     "@langfuse/otel": "^4.5.1",
@@ -49,7 +55,7 @@
     "@opentelemetry/sdk-trace-base": "^2.2.0",
     "@opentelemetry/semantic-conventions": "^1.38.0",
     "@scalar/openapi-parser": "^0.25.6",
-    "@testomatio/reporter": "2.7.3",
+    "@testomatio/reporter": "2.7.6",
     "ai": "^6.0.6",
     "axe-core": "^4.11.1",
     "bash-tool": "^1.3.15",