test(e2e): split + expand agent-scenarios into Phase A (22 → 47 tests)

- phase-a-structure.test.ts (156 lines, 14 tests): structural integrity,
  settings panel, sidebar gear, accent colors, project name/icon, grid layout
- phase-a-agent.test.ts (210 lines, 14 tests): agent pane, prompts,
  provider badge, cost display, context meter, status transitions
- phase-a-navigation.test.ts (297 lines, 19 tests): terminal tabs,
  command palette, focus switching, palette categories, shortcut hints
- Original agent-scenarios.test.ts (429 lines) deleted
- 25 new exhaustive tests added
This commit is contained in:
Hibryda 2026-03-18 03:46:40 +01:00
parent 56971c3f27
commit 718133f9f6
7 changed files with 673 additions and 434 deletions

View file

@ -79,7 +79,7 @@
- v3 workspace store (`workspace.svelte.ts`) replaces layout store for v3. Groups loaded from `~/.config/agor/groups.json` via `groups-bridge.ts`. State: groups, activeGroupId, activeTab, focusedProjectId. Derived: activeGroup, activeProjects.
- v3 groups backend (`groups.rs`): load_groups(), save_groups(), default_groups(). Tauri commands: groups_load, groups_save.
- Telemetry (`telemetry.rs`): tracing + optional OTLP export to Tempo. `AGOR_OTLP_ENDPOINT` env var controls (absent = console-only). TelemetryGuard in AppState with Drop-based shutdown. Frontend events route through `frontend_log` Tauri command → Rust tracing (no browser OTEL SDK — WebKit2GTK incompatible). `telemetry-bridge.ts` provides `tel.info/warn/error()` convenience API. Docker stack at `docker/tempo/` (Grafana port 9715).
- E2E test mode (`AGOR_TEST=1`): watcher.rs and fs_watcher.rs skip file watchers, wake-scheduler disabled via `disableWakeScheduler()`, `is_test_mode` Tauri command bridges to frontend. Data/config dirs overridable via `AGOR_TEST_DATA_DIR`/`AGOR_TEST_CONFIG_DIR`. E2E uses WebDriverIO + tauri-driver, single session, TCP readiness probe. Phase A: 7 data-testid-based scenarios in `agent-scenarios.test.ts` (deterministic assertions). Phase B: 6 scenarios in `phase-b.test.ts` (multi-project grid, independent tab switching, status bar fleet state, LLM-judged agent responses/code generation, context tab verification). LLM judge (`llm-judge.ts`): raw fetch to Anthropic API using claude-haiku-4-5, structured verdict (pass/fail + reasoning + confidence), `assertWithJudge()` with configurable threshold, skips when `ANTHROPIC_API_KEY` absent. CI workflow (`.github/workflows/e2e.yml`): unit + cargo + e2e jobs, xvfb-run, path-filtered triggers, LLM tests gated on secret. Test fixtures in `fixtures.ts` create isolated temp environments. Results tracked via JSON store in `results-db.ts`.
- E2E test mode (`AGOR_TEST=1`): watcher.rs and fs_watcher.rs skip file watchers, wake-scheduler disabled via `disableWakeScheduler()`, `is_test_mode` Tauri command bridges to frontend. Data/config dirs overridable via `AGOR_TEST_DATA_DIR`/`AGOR_TEST_CONFIG_DIR`. E2E uses WebDriverIO + tauri-driver, single session, TCP readiness probe. Phase A: 7 data-testid-based scenarios split across `phase-a-structure.test.ts`, `phase-a-agent.test.ts`, `phase-a-navigation.test.ts` (42 tests, deterministic assertions). Phase B: 6 scenarios in `phase-b.test.ts` (multi-project grid, independent tab switching, status bar fleet state, LLM-judged agent responses/code generation, context tab verification). LLM judge (`llm-judge.ts`): raw fetch to Anthropic API using claude-haiku-4-5, structured verdict (pass/fail + reasoning + confidence), `assertWithJudge()` with configurable threshold, skips when `ANTHROPIC_API_KEY` absent. CI workflow (`.github/workflows/e2e.yml`): unit + cargo + e2e jobs, xvfb-run, path-filtered triggers, LLM tests gated on secret. Test fixtures in `fixtures.ts` create isolated temp environments. Results tracked via JSON store in `results-db.ts`.
- v3 SQLite additions: agent_messages table (per-project message persistence), project_agent_state table (sdkSessionId, cost, status per project), sessions.project_id column.
- v3 App.svelte: VSCode-style sidebar layout. Horizontal: left icon rail (GlobalTabBar, 2.75rem, single Settings gear icon) + expandable drawer panel (Settings only, content-driven width, max 50%) + main workspace (ProjectGrid always visible) + StatusBar. Sidebar has Settings only — Sessions/Docs/Context are project-specific (in ProjectBox tabs). Keyboard: Ctrl+B (toggle sidebar), Ctrl+, (settings), Escape (close).
- v3 component tree: App -> GlobalTabBar (settings icon) + sidebar-panel? (SettingsTab) + workspace (ProjectGrid) + StatusBar. See `docs/architecture.md` for full tree.

View file

@ -42,7 +42,9 @@ tests/e2e/
│ └── test-mode-constants.ts # Typed env var names for test mode
└── specs/ # Test specifications
├── agor.test.ts # Smoke + UI tests (50+ tests)
├── agent-scenarios.test.ts # Phase A: agent interaction (22 tests)
├── phase-a-structure.test.ts # Phase A: structural integrity + settings (12 tests)
├── phase-a-agent.test.ts # Phase A: agent pane + prompts (15 tests)
├── phase-a-navigation.test.ts # Phase A: terminal + palette + focus (15 tests)
├── phase-b.test.ts # Phase B: multi-project + LLM judge
└── phase-c.test.ts # Phase C: hardening features (11 scenarios)
```
@ -67,7 +69,7 @@ tests/e2e/
| Phase | File | Tests | Type |
|-------|------|-------|------|
| Smoke | agor.test.ts | 50+ | Deterministic (CSS/DOM assertions) |
| A | agent-scenarios.test.ts | 22 | Deterministic (data-testid selectors) |
| A | phase-a-{structure,agent,navigation}.test.ts | 42 | Deterministic (data-testid selectors) |
| B | phase-b.test.ts | 6+ | LLM-judged (multi-project, agent quality) |
| C | phase-c.test.ts | 11 scenarios | Mixed (deterministic + LLM-judged) |

View file

@ -1,429 +0,0 @@
import { browser, expect } from '@wdio/globals';
// Phase A: Human-authored E2E scenarios with deterministic assertions.
// These test the agent UI flow end-to-end using stable data-testid selectors.
// Agent-interaction tests require a real Claude CLI install + API key.
// ─── Helpers ──────────────────────────────────────────────────────────
/** Wait for agent status to reach a target value within timeout. */
async function waitForAgentStatus(
status: string,
timeout = 30_000,
): Promise<void> {
await browser.waitUntil(
async () => {
const attr = await browser.execute(() => {
const el = document.querySelector('[data-testid="agent-pane"]');
return el?.getAttribute('data-agent-status') ?? 'idle';
});
return attr === status;
},
{ timeout, timeoutMsg: `Agent did not reach status "${status}" within ${timeout}ms` },
);
}
/** Check if an agent pane exists and is visible. */
async function agentPaneExists(): Promise<boolean> {
const el = await browser.$('[data-testid="agent-pane"]');
return el.isExisting();
}
/** Type a prompt into the agent textarea and submit. */
async function sendAgentPrompt(text: string): Promise<void> {
const textarea = await browser.$('[data-testid="agent-prompt"]');
await textarea.waitForDisplayed({ timeout: 5000 });
await textarea.setValue(text);
// Small delay for Svelte reactivity
await browser.pause(200);
const submitBtn = await browser.$('[data-testid="agent-submit"]');
await browser.execute((el) => (el as HTMLElement).click(), submitBtn);
}
// ─── Scenario 1: App renders with project grid and data-testid anchors ───
describe('Scenario 1 — App Structural Integrity', () => {
it('should render the status bar with data-testid', async () => {
const bar = await browser.$('[data-testid="status-bar"]');
await expect(bar).toBeDisplayed();
});
it('should render the sidebar rail with data-testid', async () => {
const rail = await browser.$('[data-testid="sidebar-rail"]');
await expect(rail).toBeDisplayed();
});
it('should render at least one project box with data-testid', async () => {
const boxes = await browser.$$('[data-testid="project-box"]');
expect(boxes.length).toBeGreaterThanOrEqual(1);
});
it('should have data-project-id on project boxes', async () => {
const projectId = await browser.execute(() => {
const box = document.querySelector('[data-testid="project-box"]');
return box?.getAttribute('data-project-id') ?? null;
});
expect(projectId).not.toBeNull();
expect((projectId as string).length).toBeGreaterThan(0);
});
it('should render project tabs with data-testid', async () => {
const tabs = await browser.$('[data-testid="project-tabs"]');
await expect(tabs).toBeDisplayed();
});
it('should render agent session component', async () => {
const session = await browser.$('[data-testid="agent-session"]');
await expect(session).toBeDisplayed();
});
});
// ─── Scenario 2: Settings panel via data-testid ──────────────────────
describe('Scenario 2 — Settings Panel (data-testid)', () => {
it('should open settings via data-testid button', async () => {
// Use JS click for reliability with WebKit2GTK/tauri-driver
await browser.execute(() => {
const btn = document.querySelector('[data-testid="settings-btn"]');
if (btn) (btn as HTMLElement).click();
});
const panel = await browser.$('.sidebar-panel');
await panel.waitForDisplayed({ timeout: 5000 });
// Wait for settings content to mount
await browser.waitUntil(
async () => {
const count = await browser.execute(() =>
document.querySelectorAll('.settings-tab .settings-section').length,
);
return (count as number) >= 1;
},
{ timeout: 5000 },
);
await expect(panel).toBeDisplayed();
});
it('should close settings with Escape', async () => {
await browser.keys('Escape');
const panel = await browser.$('.sidebar-panel');
await panel.waitForDisplayed({ timeout: 3000, reverse: true });
});
});
// ─── Scenario 3: Agent pane initial state ────────────────────────────
describe('Scenario 3 — Agent Pane Initial State', () => {
it('should display agent pane in idle status', async () => {
const exists = await agentPaneExists();
if (!exists) {
// Agent pane might not be visible until Model tab is active
await browser.execute(() => {
const tab = document.querySelector('[data-testid="project-tabs"] .ptab');
if (tab) (tab as HTMLElement).click();
});
await browser.pause(300);
}
const pane = await browser.$('[data-testid="agent-pane"]');
await expect(pane).toBeExisting();
const status = await browser.execute(() => {
const el = document.querySelector('[data-testid="agent-pane"]');
return el?.getAttribute('data-agent-status') ?? 'unknown';
});
expect(status).toBe('idle');
});
it('should show prompt textarea', async () => {
const textarea = await browser.$('[data-testid="agent-prompt"]');
await expect(textarea).toBeDisplayed();
});
it('should show submit button', async () => {
const btn = await browser.$('[data-testid="agent-submit"]');
await expect(btn).toBeExisting();
});
it('should have empty messages area initially', async () => {
const msgArea = await browser.$('[data-testid="agent-messages"]');
await expect(msgArea).toBeExisting();
// No message bubbles should exist in a fresh session
const msgCount = await browser.execute(() => {
const area = document.querySelector('[data-testid="agent-messages"]');
if (!area) return 0;
return area.querySelectorAll('.message').length;
});
expect(msgCount).toBe(0);
});
});
// ─── Scenario 4: Terminal tab management ─────────────────────────────
describe('Scenario 4 — Terminal Tab Management (data-testid)', () => {
before(async () => {
// Ensure Model tab is active and terminal section visible
await browser.execute(() => {
const tab = document.querySelector('[data-testid="project-tabs"] .ptab');
if (tab) (tab as HTMLElement).click();
});
await browser.pause(300);
// Expand terminal section
await browser.execute(() => {
const toggle = document.querySelector('[data-testid="terminal-toggle"]');
if (toggle) (toggle as HTMLElement).click();
});
await browser.pause(500);
});
it('should display terminal tabs container', async () => {
const tabs = await browser.$('[data-testid="terminal-tabs"]');
await expect(tabs).toBeDisplayed();
});
it('should add a shell tab via data-testid button', async () => {
await browser.execute(() => {
const btn = document.querySelector('[data-testid="tab-add"]');
if (btn) (btn as HTMLElement).click();
});
await browser.pause(500);
const tabTitle = await browser.execute(() => {
const el = document.querySelector('.tab-bar .tab-title');
return el?.textContent ?? '';
});
expect(tabTitle.toLowerCase()).toContain('shell');
});
it('should show active tab styling', async () => {
const activeTab = await browser.$('.tab.active');
await expect(activeTab).toBeExisting();
});
it('should close tab and show empty state', async () => {
// Close all tabs
await browser.execute(() => {
const closeBtns = document.querySelectorAll('.tab-close');
closeBtns.forEach(btn => (btn as HTMLElement).click());
});
await browser.pause(500);
// Should show empty terminal area with "Open terminal" button
const emptyBtn = await browser.$('.add-first');
await expect(emptyBtn).toBeDisplayed();
});
after(async () => {
// Collapse terminal section
await browser.execute(() => {
const toggle = document.querySelector('[data-testid="terminal-toggle"]');
const chevron = toggle?.querySelector('.toggle-chevron.expanded');
if (chevron) (toggle as HTMLElement).click();
});
await browser.pause(300);
});
});
// ─── Scenario 5: Command palette with data-testid ───────────────────
describe('Scenario 5 — Command Palette (data-testid)', () => {
it('should open palette and show data-testid input', async () => {
await browser.execute(() => document.body.focus());
await browser.pause(200);
await browser.keys(['Control', 'k']);
const palette = await browser.$('[data-testid="command-palette"]');
await palette.waitForDisplayed({ timeout: 3000 });
const input = await browser.$('[data-testid="palette-input"]');
await expect(input).toBeDisplayed();
});
it('should have focused input', async () => {
// Use programmatic focus check (auto-focus may not work in WebKit2GTK/tauri-driver)
const isFocused = await browser.execute(() => {
const el = document.querySelector('[data-testid="palette-input"]') as HTMLInputElement | null;
if (!el) return false;
el.focus(); // Ensure focus programmatically
return el === document.activeElement;
});
expect(isFocused).toBe(true);
});
it('should show at least one group item', async () => {
const items = await browser.$$('.palette-item');
expect(items.length).toBeGreaterThanOrEqual(1);
});
it('should filter and show no-results for nonsense query', async () => {
const input = await browser.$('[data-testid="palette-input"]');
await input.setValue('zzz_no_match_xyz');
await browser.pause(300);
const noResults = await browser.$('.no-results');
await expect(noResults).toBeDisplayed();
});
it('should close on Escape', async () => {
await browser.keys('Escape');
const palette = await browser.$('[data-testid="command-palette"]');
await browser.waitUntil(
async () => !(await palette.isDisplayed()),
{ timeout: 3000 },
);
});
});
// ─── Scenario 6: Project focus and tab switching ─────────────────────
describe('Scenario 6 — Project Focus & Tab Switching', () => {
it('should focus project on header click', async () => {
await browser.execute(() => {
const header = document.querySelector('.project-header');
if (header) (header as HTMLElement).click();
});
await browser.pause(300);
const activeBox = await browser.$('.project-box.active');
await expect(activeBox).toBeDisplayed();
});
it('should switch to Files tab and back without losing agent session', async () => {
// Get current agent session element reference
const sessionBefore = await browser.execute(() => {
const el = document.querySelector('[data-testid="agent-session"]');
return el !== null;
});
expect(sessionBefore).toBe(true);
// Switch to Files tab (second tab)
await browser.execute(() => {
const tabs = document.querySelectorAll('[data-testid="project-tabs"] .ptab');
if (tabs.length >= 2) (tabs[1] as HTMLElement).click();
});
await browser.pause(500);
// AgentSession should still exist in DOM (display:none, not unmounted)
const sessionDuring = await browser.execute(() => {
const el = document.querySelector('[data-testid="agent-session"]');
return el !== null;
});
expect(sessionDuring).toBe(true);
// Switch back to Model tab
await browser.execute(() => {
const tab = document.querySelector('[data-testid="project-tabs"] .ptab');
if (tab) (tab as HTMLElement).click();
});
await browser.pause(300);
// Agent session should be visible again
const session = await browser.$('[data-testid="agent-session"]');
await expect(session).toBeDisplayed();
});
it('should preserve agent status across tab switches', async () => {
const statusBefore = await browser.execute(() => {
const el = document.querySelector('[data-testid="agent-pane"]');
return el?.getAttribute('data-agent-status') ?? 'unknown';
});
// Switch to Context tab (third tab) and back
await browser.execute(() => {
const tabs = document.querySelectorAll('[data-testid="project-tabs"] .ptab');
if (tabs.length >= 3) (tabs[2] as HTMLElement).click();
});
await browser.pause(300);
await browser.execute(() => {
const tab = document.querySelector('[data-testid="project-tabs"] .ptab');
if (tab) (tab as HTMLElement).click();
});
await browser.pause(300);
const statusAfter = await browser.execute(() => {
const el = document.querySelector('[data-testid="agent-pane"]');
return el?.getAttribute('data-agent-status') ?? 'unknown';
});
expect(statusAfter).toBe(statusBefore);
});
});
// ─── Scenario 7: Agent prompt interaction (requires Claude CLI) ──────
describe('Scenario 7 — Agent Prompt Submission', () => {
// This scenario requires a real Claude CLI + API key.
// Skip gracefully if agent doesn't transition to "running" within timeout.
it('should accept text in prompt textarea', async () => {
const textarea = await browser.$('[data-testid="agent-prompt"]');
await textarea.waitForDisplayed({ timeout: 5000 });
await textarea.setValue('Say hello');
await browser.pause(200);
const value = await textarea.getValue();
expect(value).toBe('Say hello');
// Clear without submitting
await textarea.clearValue();
});
it('should enable submit button when prompt has text', async () => {
const textarea = await browser.$('[data-testid="agent-prompt"]');
await textarea.setValue('Test prompt');
await browser.pause(200);
// Submit button should be interactable (not disabled)
const isDisabled = await browser.execute(() => {
const btn = document.querySelector('[data-testid="agent-submit"]');
if (!btn) return true;
return (btn as HTMLButtonElement).disabled;
});
expect(isDisabled).toBe(false);
await textarea.clearValue();
});
it('should show stop button during agent execution (if Claude available)', async function () {
// Send a minimal prompt
await sendAgentPrompt('Reply with exactly: AGOR_TEST_OK');
// Wait for running status (generous timeout for sidecar spin-up)
try {
await waitForAgentStatus('running', 15_000);
} catch {
// Claude CLI not available — skip remaining assertions
console.log('Agent did not start — Claude CLI may not be available. Skipping.');
this.skip();
return;
}
// If agent is still running, check for stop button
const status = await browser.execute(() => {
const el = document.querySelector('[data-testid="agent-pane"]');
return el?.getAttribute('data-agent-status') ?? 'unknown';
});
if (status === 'running') {
const stopBtn = await browser.$('[data-testid="agent-stop"]');
await expect(stopBtn).toBeDisplayed();
}
// Wait for completion (with shorter timeout to avoid mocha timeout)
try {
await waitForAgentStatus('idle', 40_000);
} catch {
console.log('Agent did not complete within 40s — skipping completion checks.');
this.skip();
return;
}
// Messages area should now have content
const msgCount = await browser.execute(() => {
const area = document.querySelector('[data-testid="agent-messages"]');
if (!area) return 0;
return area.children.length;
});
expect(msgCount).toBeGreaterThan(0);
});
});

View file

@ -0,0 +1,210 @@
import { browser, expect } from '@wdio/globals';
// Phase A — Agent: Agent pane initial state + prompt submission + NEW agent tests.
// Shares a single Tauri app session with other phase-a-* spec files.
// ─── Helpers ──────────────────────────────────────────────────────────
async function waitForAgentStatus(status: string, timeout = 30_000): Promise<void> {
await browser.waitUntil(
async () => {
const attr = await browser.execute(() => {
const el = document.querySelector('[data-testid="agent-pane"]');
return el?.getAttribute('data-agent-status') ?? 'idle';
});
return attr === status;
},
{ timeout, timeoutMsg: `Agent did not reach status "${status}" within ${timeout}ms` },
);
}
async function agentPaneExists(): Promise<boolean> {
const el = await browser.$('[data-testid="agent-pane"]');
return el.isExisting();
}
async function sendAgentPrompt(text: string): Promise<void> {
const textarea = await browser.$('[data-testid="agent-prompt"]');
await textarea.waitForDisplayed({ timeout: 5000 });
await textarea.setValue(text);
await browser.pause(200);
const submitBtn = await browser.$('[data-testid="agent-submit"]');
await browser.execute((el) => (el as HTMLElement).click(), submitBtn);
}
async function getAgentStatus(): Promise<string> {
return browser.execute(() => {
const el = document.querySelector('[data-testid="agent-pane"]');
return el?.getAttribute('data-agent-status') ?? 'unknown';
});
}
async function getMessageCount(): Promise<number> {
return browser.execute(() => {
const area = document.querySelector('[data-testid="agent-messages"]');
return area ? area.children.length : 0;
});
}
// ─── Scenario 3: Agent pane initial state ────────────────────────────
describe('Scenario 3 — Agent Pane Initial State', () => {
it('should display agent pane in idle status', async () => {
if (!(await agentPaneExists())) {
await browser.execute(() => {
const tab = document.querySelector('[data-testid="project-tabs"] .ptab');
if (tab) (tab as HTMLElement).click();
});
await browser.pause(300);
}
const pane = await browser.$('[data-testid="agent-pane"]');
await expect(pane).toBeExisting();
expect(await getAgentStatus()).toBe('idle');
});
it('should show prompt textarea', async () => {
const textarea = await browser.$('[data-testid="agent-prompt"]');
await expect(textarea).toBeDisplayed();
});
it('should show submit button', async () => {
const btn = await browser.$('[data-testid="agent-submit"]');
await expect(btn).toBeExisting();
});
it('should have empty messages area initially', async () => {
const msgArea = await browser.$('[data-testid="agent-messages"]');
await expect(msgArea).toBeExisting();
const msgCount = await browser.execute(() => {
const area = document.querySelector('[data-testid="agent-messages"]');
return area ? area.querySelectorAll('.message').length : 0;
});
expect(msgCount).toBe(0);
});
it('should show agent provider name or badge', async () => {
const hasContent = await browser.execute(() => {
const session = document.querySelector('[data-testid="agent-session"]');
return session !== null && (session.textContent ?? '').length > 0;
});
expect(hasContent).toBe(true);
});
it('should show session ID or cost display area', async () => {
const hasCostArea = await browser.execute(() => {
const pane = document.querySelector('[data-testid="agent-pane"]');
if (!pane) return false;
return (pane.querySelector('.cost-bar') || pane.querySelector('.status-strip')) !== null;
});
expect(hasCostArea).toBe(true);
});
it('should show context meter (token usage bar)', async () => {
const has = await browser.execute(() => {
const pane = document.querySelector('[data-testid="agent-pane"]');
if (!pane) return false;
return (pane.querySelector('.context-meter') || pane.querySelector('.usage-meter')) !== null;
});
expect(has).toBe(true);
});
it('should have tool call/result collapsible sections area', async () => {
const ready = await browser.execute(() => {
const area = document.querySelector('[data-testid="agent-messages"]');
return area !== null && area instanceof HTMLElement;
});
expect(ready).toBe(true);
});
});
// ─── Scenario 7: Agent prompt interaction (requires Claude CLI) ──────
describe('Scenario 7 — Agent Prompt Submission', () => {
it('should accept text in prompt textarea', async () => {
const textarea = await browser.$('[data-testid="agent-prompt"]');
await textarea.waitForDisplayed({ timeout: 5000 });
await textarea.setValue('Say hello');
await browser.pause(200);
expect(await textarea.getValue()).toBe('Say hello');
await textarea.clearValue();
});
it('should enable submit button when prompt has text', async () => {
const textarea = await browser.$('[data-testid="agent-prompt"]');
await textarea.setValue('Test prompt');
await browser.pause(200);
const isDisabled = await browser.execute(() => {
const btn = document.querySelector('[data-testid="agent-submit"]');
return btn ? (btn as HTMLButtonElement).disabled : true;
});
expect(isDisabled).toBe(false);
await textarea.clearValue();
});
it('should show stop button during agent execution (if Claude available)', async function () {
await sendAgentPrompt('Reply with exactly: AGOR_TEST_OK');
try { await waitForAgentStatus('running', 15_000); } catch {
console.log('Agent did not start — Claude CLI may not be available. Skipping.');
this.skip(); return;
}
const status = await getAgentStatus();
if (status === 'running') {
const stopBtn = await browser.$('[data-testid="agent-stop"]');
await expect(stopBtn).toBeDisplayed();
}
try { await waitForAgentStatus('idle', 40_000); } catch {
console.log('Agent did not complete within 40s — skipping completion checks.');
this.skip(); return;
}
expect(await getMessageCount()).toBeGreaterThan(0);
});
it('should show agent status transitions (idle -> running -> idle)', async function () {
expect(await getAgentStatus()).toBe('idle');
await sendAgentPrompt('Reply with one word: OK');
try { await waitForAgentStatus('running', 15_000); } catch {
console.log('Agent did not start — skipping status transition test.');
this.skip(); return;
}
expect(await getAgentStatus()).toBe('running');
try { await waitForAgentStatus('idle', 40_000); } catch {
this.skip(); return;
}
expect(await getAgentStatus()).toBe('idle');
});
it('should show message count increasing during execution', async function () {
const countBefore = await getMessageCount();
await sendAgentPrompt('Reply with exactly: AGOR_MSG_COUNT_TEST');
try { await waitForAgentStatus('running', 15_000); } catch {
this.skip(); return;
}
try { await waitForAgentStatus('idle', 40_000); } catch {
this.skip(); return;
}
expect(await getMessageCount()).toBeGreaterThan(countBefore);
});
it('should disable prompt input while agent is running', async function () {
await sendAgentPrompt('Reply with exactly: AGOR_DISABLE_TEST');
try { await waitForAgentStatus('running', 15_000); } catch {
this.skip(); return;
}
const uiState = await browser.execute(() => {
const textarea = document.querySelector('[data-testid="agent-prompt"]') as HTMLTextAreaElement | null;
const stopBtn = document.querySelector('[data-testid="agent-stop"]');
return {
textareaDisabled: textarea?.disabled ?? false,
stopBtnVisible: stopBtn !== null && (stopBtn as HTMLElement).offsetParent !== null,
};
});
expect(uiState.textareaDisabled || uiState.stopBtnVisible).toBe(true);
try { await waitForAgentStatus('idle', 40_000); } catch {
await browser.execute(() => {
const btn = document.querySelector('[data-testid="agent-stop"]');
if (btn) (btn as HTMLElement).click();
});
await browser.pause(2000);
}
});
});

View file

@ -0,0 +1,297 @@
import { browser, expect } from '@wdio/globals';
// Phase A — Navigation: Terminal tabs + command palette + project focus + NEW tests.
// Shares a single Tauri app session with other phase-a-* spec files.
describe('Scenario 4 — Terminal Tab Management (data-testid)', () => {
before(async () => {
await browser.execute(() => {
const tab = document.querySelector('[data-testid="project-tabs"] .ptab');
if (tab) (tab as HTMLElement).click();
});
await browser.pause(300);
// Expand terminal section
await browser.execute(() => {
const toggle = document.querySelector('[data-testid="terminal-toggle"]');
if (toggle) (toggle as HTMLElement).click();
});
await browser.pause(500);
});
it('should display terminal tabs container', async () => {
const tabs = await browser.$('[data-testid="terminal-tabs"]');
await expect(tabs).toBeDisplayed();
});
it('should add a shell tab via data-testid button', async () => {
await browser.execute(() => {
const btn = document.querySelector('[data-testid="tab-add"]');
if (btn) (btn as HTMLElement).click();
});
await browser.pause(500);
const tabTitle = await browser.execute(() => {
const el = document.querySelector('.tab-bar .tab-title');
return el?.textContent ?? '';
});
expect(tabTitle.toLowerCase()).toContain('shell');
});
it('should show active tab styling', async () => {
const activeTab = await browser.$('.tab.active');
await expect(activeTab).toBeExisting();
});
it('should close tab and show empty state', async () => {
await browser.execute(() => {
document.querySelectorAll('.tab-close').forEach(btn => (btn as HTMLElement).click());
});
await browser.pause(500);
const emptyBtn = await browser.$('.add-first');
await expect(emptyBtn).toBeDisplayed();
});
it('should show terminal toggle chevron', async () => {
const has = await browser.execute(() => {
const toggle = document.querySelector('[data-testid="terminal-toggle"]');
return toggle?.querySelector('.toggle-chevron') !== null;
});
expect(has).toBe(true);
});
it('should show agent preview button (eye icon) if agent session active', async () => {
const tabsExist = await browser.$('[data-testid="terminal-tabs"]');
await expect(tabsExist).toBeDisplayed();
// Preview button presence depends on active agent session
const hasPreviewBtn = await browser.execute(() => {
const tabs = document.querySelector('[data-testid="terminal-tabs"]');
return tabs?.querySelector('.tab-add.tab-agent-preview') !== null;
});
if (hasPreviewBtn) {
const withinTabs = await browser.execute(() => {
const tabs = document.querySelector('[data-testid="terminal-tabs"]');
return tabs?.querySelector('.tab-add.tab-agent-preview') !== null;
});
expect(withinTabs).toBe(true);
}
});
it('should maintain terminal state across project tab switches', async () => {
// Add a shell tab
await browser.execute(() => {
const btn = document.querySelector('[data-testid="tab-add"]');
if (btn) (btn as HTMLElement).click();
});
await browser.pause(500);
const countBefore = await browser.execute(() =>
document.querySelectorAll('.tab-bar .tab').length,
);
// Switch to Files tab and back
await browser.execute(() => {
const tabs = document.querySelectorAll('[data-testid="project-tabs"] .ptab');
if (tabs.length >= 2) (tabs[1] as HTMLElement).click();
});
await browser.pause(300);
await browser.execute(() => {
const tab = document.querySelector('[data-testid="project-tabs"] .ptab');
if (tab) (tab as HTMLElement).click();
});
await browser.pause(300);
const countAfter = await browser.execute(() =>
document.querySelectorAll('.tab-bar .tab').length,
);
expect(countAfter).toBe(countBefore);
// Clean up
await browser.execute(() => {
document.querySelectorAll('.tab-close').forEach(btn => (btn as HTMLElement).click());
});
await browser.pause(300);
});
after(async () => {
await browser.execute(() => {
const toggle = document.querySelector('[data-testid="terminal-toggle"]');
if (toggle?.querySelector('.toggle-chevron.expanded')) (toggle as HTMLElement).click();
});
await browser.pause(300);
});
});
describe('Scenario 5 — Command Palette (data-testid)', () => {
before(async () => {
await browser.execute(() => {
const p = document.querySelector('[data-testid="command-palette"]');
if (p && (p as HTMLElement).offsetParent !== null)
document.dispatchEvent(new KeyboardEvent('keydown', { key: 'Escape' }));
});
await browser.pause(200);
});
it('should open palette and show data-testid input', async () => {
await browser.execute(() => document.body.focus());
await browser.pause(200);
await browser.keys(['Control', 'k']);
const palette = await browser.$('[data-testid="command-palette"]');
await palette.waitForDisplayed({ timeout: 3000 });
const input = await browser.$('[data-testid="palette-input"]');
await expect(input).toBeDisplayed();
});
it('should have focused input', async () => {
const isFocused = await browser.execute(() => {
const el = document.querySelector('[data-testid="palette-input"]') as HTMLInputElement | null;
if (!el) return false;
el.focus();
return el === document.activeElement;
});
expect(isFocused).toBe(true);
});
it('should show at least one group item', async () => {
const items = await browser.$$('.palette-item');
expect(items.length).toBeGreaterThanOrEqual(1);
});
it('should filter and show no-results for nonsense query', async () => {
const input = await browser.$('[data-testid="palette-input"]');
await input.setValue('zzz_no_match_xyz');
await browser.pause(300);
const noResults = await browser.$('.no-results');
await expect(noResults).toBeDisplayed();
});
it('should show command categories in palette', async () => {
const input = await browser.$('[data-testid="palette-input"]');
await input.clearValue();
await browser.pause(300);
const catCount = await browser.execute(() =>
document.querySelectorAll('.palette-category').length,
);
expect(catCount).toBeGreaterThanOrEqual(1);
});
it('should execute palette command (e.g., toggle settings)', async () => {
const input = await browser.$('[data-testid="palette-input"]');
await input.clearValue();
await input.setValue('settings');
await browser.pause(300);
const executed = await browser.execute(() => {
const item = document.querySelector('.palette-item');
if (item) { (item as HTMLElement).click(); return true; }
return false;
});
expect(executed).toBe(true);
await browser.pause(500);
const paletteGone = await browser.execute(() => {
const p = document.querySelector('[data-testid="command-palette"]');
return p === null || (p as HTMLElement).offsetParent === null;
});
expect(paletteGone).toBe(true);
// Clean up
await browser.keys('Escape');
await browser.pause(300);
});
it('should show keyboard shortcut hints in palette items', async () => {
await browser.execute(() => document.body.focus());
await browser.pause(200);
await browser.keys(['Control', 'k']);
await browser.pause(300);
const has = await browser.execute(() =>
document.querySelectorAll('.palette-item .cmd-shortcut').length > 0,
);
expect(has).toBe(true);
});
it('should close on Escape', async () => {
await browser.keys('Escape');
const palette = await browser.$('[data-testid="command-palette"]');
await browser.waitUntil(async () => !(await palette.isDisplayed()), { timeout: 3000 });
});
});
describe('Scenario 6 — Project Focus & Tab Switching', () => {
before(async () => {
await browser.execute(() => {
const tab = document.querySelector('[data-testid="project-tabs"] .ptab');
if (tab) (tab as HTMLElement).click();
});
await browser.pause(300);
});
it('should focus project on header click', async () => {
await browser.execute(() => {
const header = document.querySelector('.project-header');
if (header) (header as HTMLElement).click();
});
await browser.pause(300);
const activeBox = await browser.$('.project-box.active');
await expect(activeBox).toBeDisplayed();
});
it('should switch to Files tab and back without losing agent session', async () => {
expect(await browser.execute(() =>
document.querySelector('[data-testid="agent-session"]') !== null,
)).toBe(true);
await browser.execute(() => {
const tabs = document.querySelectorAll('[data-testid="project-tabs"] .ptab');
if (tabs.length >= 2) (tabs[1] as HTMLElement).click();
});
await browser.pause(500);
expect(await browser.execute(() =>
document.querySelector('[data-testid="agent-session"]') !== null,
)).toBe(true);
await browser.execute(() => {
const tab = document.querySelector('[data-testid="project-tabs"] .ptab');
if (tab) (tab as HTMLElement).click();
});
await browser.pause(300);
const session = await browser.$('[data-testid="agent-session"]');
await expect(session).toBeDisplayed();
});
it('should preserve agent status across tab switches', async () => {
const statusBefore = await browser.execute(() =>
document.querySelector('[data-testid="agent-pane"]')?.getAttribute('data-agent-status') ?? 'unknown',
);
await browser.execute(() => {
const tabs = document.querySelectorAll('[data-testid="project-tabs"] .ptab');
if (tabs.length >= 3) (tabs[2] as HTMLElement).click();
});
await browser.pause(300);
await browser.execute(() => {
const tab = document.querySelector('[data-testid="project-tabs"] .ptab');
if (tab) (tab as HTMLElement).click();
});
await browser.pause(300);
const statusAfter = await browser.execute(() =>
document.querySelector('[data-testid="agent-pane"]')?.getAttribute('data-agent-status') ?? 'unknown',
);
expect(statusAfter).toBe(statusBefore);
});
it('should show tab count badge in terminal toggle', async () => {
await browser.execute(() => {
const toggle = document.querySelector('[data-testid="terminal-toggle"]');
if (toggle) (toggle as HTMLElement).click();
});
await browser.pause(300);
await browser.execute(() => {
const btn = document.querySelector('[data-testid="tab-add"]');
if (btn) (btn as HTMLElement).click();
});
await browser.pause(500);
const text = await browser.execute(() =>
document.querySelector('[data-testid="terminal-toggle"]')?.textContent?.trim() ?? '',
);
expect(text.length).toBeGreaterThan(0);
// Clean up
await browser.execute(() => {
document.querySelectorAll('.tab-close').forEach(btn => (btn as HTMLElement).click());
});
await browser.pause(300);
await browser.execute(() => {
const toggle = document.querySelector('[data-testid="terminal-toggle"]');
if (toggle?.querySelector('.toggle-chevron.expanded')) (toggle as HTMLElement).click();
});
await browser.pause(300);
});
});

View file

@ -0,0 +1,156 @@
import { browser, expect } from '@wdio/globals';
// Phase A — Structure: App structural integrity + settings panel + NEW structural tests.
// Shares a single Tauri app session with other phase-a-* spec files.
// ─── Scenario 1: App renders with project grid and data-testid anchors ───
describe('Scenario 1 — App Structural Integrity', () => {
it('should render the status bar with data-testid', async () => {
const bar = await browser.$('[data-testid="status-bar"]');
await expect(bar).toBeDisplayed();
});
it('should render the sidebar rail with data-testid', async () => {
const rail = await browser.$('[data-testid="sidebar-rail"]');
await expect(rail).toBeDisplayed();
});
it('should render at least one project box with data-testid', async () => {
const boxes = await browser.$$('[data-testid="project-box"]');
expect(boxes.length).toBeGreaterThanOrEqual(1);
});
it('should have data-project-id on project boxes', async () => {
const projectId = await browser.execute(() => {
const box = document.querySelector('[data-testid="project-box"]');
return box?.getAttribute('data-project-id') ?? null;
});
expect(projectId).not.toBeNull();
expect((projectId as string).length).toBeGreaterThan(0);
});
it('should render project tabs with data-testid', async () => {
const tabs = await browser.$('[data-testid="project-tabs"]');
await expect(tabs).toBeDisplayed();
});
it('should render agent session component', async () => {
const session = await browser.$('[data-testid="agent-session"]');
await expect(session).toBeDisplayed();
});
// ─── NEW structural tests ────────────────────────────────────────────
it('should render sidebar gear icon for settings', async () => {
const btn = await browser.$('[data-testid="settings-btn"]');
await expect(btn).toBeExisting();
await expect(btn).toBeDisplayed();
});
it('should have data-testid on status bar sections (agent-counts, cost, attention)', async () => {
// Status bar left section contains agent state items and attention
const leftItems = await browser.execute(() => {
const bar = document.querySelector('[data-testid="status-bar"]');
if (!bar) return { left: false, right: false };
const left = bar.querySelector('.left');
const right = bar.querySelector('.right');
return { left: left !== null, right: right !== null };
});
expect(leftItems.left).toBe(true);
expect(leftItems.right).toBe(true);
});
it('should render project accent colors (different per slot)', async () => {
const accents = await browser.execute(() => {
const boxes = document.querySelectorAll('[data-testid="project-box"]');
const styles: string[] = [];
boxes.forEach(box => {
const style = (box as HTMLElement).getAttribute('style') ?? '';
styles.push(style);
});
return styles;
});
// Each project box should have a --accent CSS variable
for (const style of accents) {
expect(style).toContain('--accent');
}
// If multiple boxes exist, accents should differ (cyclic assignment)
if (accents.length >= 2) {
// At least the first two should have different accent values
expect(accents[0]).not.toBe(accents[1]);
}
});
it('should show project name in header', async () => {
const name = await browser.execute(() => {
const el = document.querySelector('.project-header .project-name');
return el?.textContent?.trim() ?? '';
});
expect(name.length).toBeGreaterThan(0);
});
it('should show project icon in header', async () => {
const icon = await browser.execute(() => {
const el = document.querySelector('.project-header .project-icon');
return el?.textContent?.trim() ?? '';
});
// Icon should be a non-empty string (emoji or fallback folder icon)
expect(icon.length).toBeGreaterThan(0);
});
it('should have correct grid layout (project boxes fill available space)', async () => {
const layout = await browser.execute(() => {
const box = document.querySelector('[data-testid="project-box"]') as HTMLElement | null;
if (!box) return { width: 0, height: 0 };
const rect = box.getBoundingClientRect();
return { width: rect.width, height: rect.height };
});
// Project box should have non-trivial dimensions (fills grid slot)
expect(layout.width).toBeGreaterThan(100);
expect(layout.height).toBeGreaterThan(100);
});
});
// ─── Scenario 2: Settings panel via data-testid ──────────────────────
describe('Scenario 2 — Settings Panel (data-testid)', () => {
before(async () => {
// Ensure settings panel is closed before starting
await browser.execute(() => {
const panel = document.querySelector('.sidebar-panel');
if (panel && (panel as HTMLElement).offsetParent !== null) {
document.dispatchEvent(new KeyboardEvent('keydown', { key: 'Escape' }));
}
});
await browser.pause(300);
});
it('should open settings via data-testid button', async () => {
// Use JS click for reliability with WebKit2GTK/tauri-driver
await browser.execute(() => {
const btn = document.querySelector('[data-testid="settings-btn"]');
if (btn) (btn as HTMLElement).click();
});
const panel = await browser.$('.sidebar-panel');
await panel.waitForDisplayed({ timeout: 5000 });
// Wait for settings content to mount
await browser.waitUntil(
async () => {
const count = await browser.execute(() =>
document.querySelectorAll('.settings-tab .settings-section').length,
);
return (count as number) >= 1;
},
{ timeout: 5000 },
);
await expect(panel).toBeDisplayed();
});
it('should close settings with Escape', async () => {
await browser.keys('Escape');
const panel = await browser.$('.sidebar-panel');
await panel.waitForDisplayed({ timeout: 3000, reverse: true });
});
});

View file

@ -45,8 +45,11 @@ export const config = {
resolve(projectRoot, 'tests/e2e/specs/settings.test.ts'),
resolve(projectRoot, 'tests/e2e/specs/features.test.ts'),
resolve(projectRoot, 'tests/e2e/specs/terminal-theme.test.ts'),
resolve(projectRoot, 'tests/e2e/specs/agent-scenarios.test.ts'),
resolve(projectRoot, 'tests/e2e/specs/phase-b.test.ts'),
resolve(projectRoot, 'tests/e2e/specs/phase-a-structure.test.ts'),
resolve(projectRoot, 'tests/e2e/specs/phase-a-agent.test.ts'),
resolve(projectRoot, 'tests/e2e/specs/phase-a-navigation.test.ts'),
resolve(projectRoot, 'tests/e2e/specs/phase-b-grid.test.ts'),
resolve(projectRoot, 'tests/e2e/specs/phase-b-llm.test.ts'),
resolve(projectRoot, 'tests/e2e/specs/phase-c-ui.test.ts'),
resolve(projectRoot, 'tests/e2e/specs/phase-c-tabs.test.ts'),
resolve(projectRoot, 'tests/e2e/specs/phase-c-llm.test.ts'),