docs: add setup and API guides and align scraper run actions

saifyxpro · saifyxpro · commit 78e2efb56f5b · 2026-03-16T09:16:35.000+05:00
diff --git a/README.md b/README.md
@@ -290,7 +290,7 @@ All three commands now resolve to the same root dev target.
 
 ### 🐳 Docker Deployment
 
-HeadlessX can be easily deployed using Docker Compose. See the [Docker Setup Guide](docs/docker_setup.md) for detailed instructions.
+HeadlessX can be easily deployed using Docker Compose. See the [Setup Guide](docs/setup-guide.md) for detailed instructions.
 
 ```bash
 # Start the application in detached mode
@@ -361,6 +361,8 @@ WEB_PORT=3000 pnpm --filter headlessx-web dev
 
 ## 🌐 API Endpoints
 
+For the full backend route inventory, see [docs/api-endpoints.md](docs/api-endpoints.md).
+
 ### Website Scraping APIs
 
 | Endpoint                  | Method | Description                  |
diff --git a/apps/web/src/components/playground/exa/config/ActionButtons.tsx b/apps/web/src/components/playground/exa/config/ActionButtons.tsx
@@ -14,7 +14,7 @@ export function ActionButtons({ disabled = false, isPending, onRun, onStop }: Ac
                 type="button"
                 onClick={onRun}
                 disabled={disabled || isPending}
-                className="inline-flex h-12 items-center justify-center rounded-2xl bg-slate-900 px-5 text-sm font-semibold text-white transition-colors hover:bg-slate-800 disabled:cursor-not-allowed disabled:bg-slate-200 disabled:text-slate-500"
+                className="inline-flex h-12 items-center justify-center rounded-2xl bg-primary px-5 text-sm font-semibold text-primary-foreground transition-colors hover:bg-primary/90 disabled:cursor-not-allowed disabled:bg-slate-200 disabled:text-slate-500"
             >
                 Run Search
             </button>
diff --git a/apps/web/src/components/playground/google-serp/ConfigurationPanel.tsx b/apps/web/src/components/playground/google-serp/ConfigurationPanel.tsx
@@ -118,7 +118,7 @@ export function ConfigurationPanel({
                             <button
                                 type="submit"
                                 disabled={!query.trim() || isLoading}
-                                className="inline-flex w-full items-center justify-center gap-2 rounded-2xl bg-slate-900 px-4 py-4 text-sm font-semibold text-white transition-colors hover:bg-slate-800 disabled:cursor-not-allowed disabled:opacity-60"
+                                className="inline-flex w-full items-center justify-center gap-2 rounded-2xl bg-primary px-4 py-4 text-sm font-semibold text-primary-foreground transition-colors hover:bg-primary/90 disabled:cursor-not-allowed disabled:opacity-60"
                             >
                                 {isLoading ? (
                                     <>
diff --git a/apps/web/src/components/playground/tavily/config/ActionButtons.tsx b/apps/web/src/components/playground/tavily/config/ActionButtons.tsx
@@ -28,7 +28,7 @@ export function ActionButtons({
                 type="button"
                 onClick={onRun}
                 disabled={isPending || !hasQuery || !hasApiKey}
-                className="inline-flex items-center justify-center gap-2 rounded-2xl bg-slate-900 px-4 py-4 text-sm font-semibold text-white transition-colors hover:bg-slate-800 disabled:cursor-not-allowed disabled:opacity-60"
+                className="inline-flex items-center justify-center gap-2 rounded-2xl bg-primary px-4 py-4 text-sm font-semibold text-primary-foreground transition-colors hover:bg-primary/90 disabled:cursor-not-allowed disabled:opacity-60"
             >
                 <HugeiconsIcon icon={ButtonIcon} className="h-4 w-4" />
                 {buttonLabel}
diff --git a/apps/web/src/components/playground/website/config/ActionButtons.tsx b/apps/web/src/components/playground/website/config/ActionButtons.tsx
@@ -29,7 +29,7 @@ export function ActionButtons({
                 type="button"
                 onClick={onRun}
                 disabled={isPending || !hasUrl}
-                className="inline-flex items-center justify-center gap-2 rounded-2xl bg-slate-900 px-4 py-4 text-sm font-semibold text-white transition-colors hover:bg-slate-800 disabled:cursor-not-allowed disabled:opacity-60"
+                className="inline-flex items-center justify-center gap-2 rounded-2xl bg-primary px-4 py-4 text-sm font-semibold text-primary-foreground transition-colors hover:bg-primary/90 disabled:cursor-not-allowed disabled:opacity-60"
             >
                 <HugeiconsIcon icon={tool === 'map' ? LinkSquare01Icon : SparklesIcon} className="h-4 w-4" />
                 {buttonLabel}
diff --git a/apps/web/src/components/playground/youtube/config/ActionButtons.tsx b/apps/web/src/components/playground/youtube/config/ActionButtons.tsx
@@ -14,7 +14,7 @@ export function ActionButtons({ disabled = false, isPending, onRun, onStop }: Ac
                 type="button"
                 onClick={onRun}
                 disabled={disabled || isPending}
-                className="inline-flex h-12 items-center justify-center rounded-2xl bg-slate-900 px-5 text-sm font-semibold text-white transition-colors hover:bg-slate-800 disabled:cursor-not-allowed disabled:bg-slate-200 disabled:text-slate-500"
+                className="inline-flex h-12 items-center justify-center rounded-2xl bg-primary px-5 text-sm font-semibold text-primary-foreground transition-colors hover:bg-primary/90 disabled:cursor-not-allowed disabled:bg-slate-200 disabled:text-slate-500"
             >
                 Extract
             </button>
diff --git a/docs/api-endpoints.md b/docs/api-endpoints.md
@@ -0,0 +1,176 @@
+# API Endpoints
+
+This document describes the backend HTTP surface for `apps/api` in HeadlessX.
+
+It is based on the current route tree mounted in `apps/api/src/app.ts`.
+
+## Backend System Summary
+
+- Runtime: Express 5 API with TypeScript
+- Persistence: PostgreSQL via Prisma
+- Auth: `x-api-key` guard on all non-health routes
+- Async jobs: BullMQ with Redis and a separate worker process
+- Browser scraping: Camoufox and Playwright services
+- External integrations: Tavily, Exa, yt-engine, HTML-to-Markdown service
+
+## Auth And Transport
+
+- Public route: `GET /api/health`
+- Protected routes: every other `/api/*` endpoint requires `x-api-key`
+- Internal dashboard traffic can use `DASHBOARD_INTERNAL_API_KEY`
+- SSE endpoints use `text/event-stream`
+
+Common SSE event names in this backend:
+
+- `start`
+- `progress`
+- `result`
+- `error`
+- `done`
+
+The Google SERP stream is the exception: it currently ends with an `end` event instead of `done`.
+
+## Dependency Notes
+
+| Area | Requirement |
+| --- | --- |
+| `/api/jobs/*` | Redis plus the queue worker |
+| `/api/website/crawl` | Redis plus the queue worker |
+| `/api/website/content` | Uses the service at `HTML_TO_MARKDOWN_SERVICE_URL` when available; otherwise falls back to local processing |
+| `/api/tavily/*` | `TAVILY_API_KEY` |
+| `/api/exa/*` | `EXA_API_KEY` |
+| `/api/youtube/*` | `YT_ENGINE_URL` |
+| most protected routes | PostgreSQL for API keys, logs, settings, proxies, and persisted data |
+
+## Core Endpoints
+
+| Method | Path | Purpose |
+| --- | --- | --- |
+| `GET` | `/api/health` | Public health check and route summary |
+| `GET` | `/api/config` | Read current system settings |
+| `PATCH` | `/api/config` | Update system settings and restart browser runtime |
+| `GET` | `/api/dashboard/stats` | Read dashboard summary metrics |
+| `GET` | `/api/logs` | List paginated request logs |
+| `GET` | `/api/logs/stats` | Read aggregated request log stats |
+| `GET` | `/api/keys` | List API keys |
+| `POST` | `/api/keys` | Create API key |
+| `PATCH` | `/api/keys/:id/revoke` | Revoke API key |
+| `DELETE` | `/api/keys/:id` | Delete API key |
+
+## Proxy Endpoints
+
+| Method | Path | Purpose |
+| --- | --- | --- |
+| `GET` | `/api/proxies` | List all proxies |
+| `GET` | `/api/proxies/active` | List active proxies only |
+| `GET` | `/api/proxies/:id` | Read one proxy |
+| `POST` | `/api/proxies` | Create proxy |
+| `PATCH` | `/api/proxies/:id` | Update proxy |
+| `DELETE` | `/api/proxies/:id` | Delete proxy |
+| `POST` | `/api/proxies/:id/toggle` | Toggle active state |
+| `POST` | `/api/proxies/:id/test` | Test proxy connectivity |
+
+## Website Scraper Endpoints
+
+| Method | Path | Purpose | Notes |
+| --- | --- | --- | --- |
+| `POST` | `/api/website/scrape` | SSE website scrape | Primary streaming scrape route |
+| `POST` | `/api/website/stream` | SSE website scrape | Legacy alias of `/api/website/scrape` |
+| `POST` | `/api/website/map` | Discover links quickly | Non-streaming |
+| `POST` | `/api/website/map/stream` | Stream site discovery progress | SSE |
+| `POST` | `/api/website/crawl` | Queue-backed crawl job | Requires Redis and worker |
+| `POST` | `/api/website/html` | Fast HTML scrape | No JS rendering |
+| `POST` | `/api/website/html-js` | JS-rendered HTML scrape | Browser-rendered |
+| `POST` | `/api/website/content` | Markdown content extraction | Uses markdown service when configured |
+| `POST` | `/api/website/screenshot` | Full-page screenshot | Binary image result |
+
+## Google SERP Endpoints
+
+| Method | Path | Purpose | Notes |
+| --- | --- | --- | --- |
+| `POST` | `/api/google-serp/search` | Standard Google result scrape | JSON response |
+| `GET` | `/api/google-serp/stream` | Stream Google search progress | SSE, expects query params like `query` and optional `timeout` |
+| `GET` | `/api/google-serp/status` | Service status | Lightweight availability check |
+
+## Tavily Endpoints
+
+| Method | Path | Purpose |
+| --- | --- | --- |
+| `POST` | `/api/tavily/search` | Tavily search |
+| `POST` | `/api/tavily/research` | Start Tavily research workflow |
+| `GET` | `/api/tavily/research/:requestId` | Poll Tavily research result |
+| `GET` | `/api/tavily/status` | Tavily configuration and status |
+
+## Exa Endpoints
+
+| Method | Path | Purpose | Notes |
+| --- | --- | --- | --- |
+| `POST` | `/api/exa/search` | Standard Exa search | JSON response |
+| `POST` | `/api/exa/search/stream` | Stream Exa search progress | SSE |
+| `GET` | `/api/exa/status` | Exa configuration and status | Lightweight availability check |
+
+## YouTube Endpoints
+
+| Method | Path | Purpose | Notes |
+| --- | --- | --- | --- |
+| `POST` | `/api/youtube/info/stream` | Stream YouTube extract flow | SSE |
+| `POST` | `/api/youtube/info` | Extract YouTube metadata | JSON response |
+| `POST` | `/api/youtube/formats` | Extract available format inventory | JSON response |
+| `POST` | `/api/youtube/subtitles` | Extract subtitles and captions | JSON response |
+| `POST` | `/api/youtube/save/stream` | Stream temporary download packaging | SSE |
+| `POST` | `/api/youtube/save` | Create temporary downloadable archive | JSON response |
+| `GET` | `/api/youtube/download/:jobId` | Download generated zip | Proxies yt-engine artifact |
+| `DELETE` | `/api/youtube/download/:jobId` | Delete temporary saved artifact | Cleanup endpoint |
+| `GET` | `/api/youtube/status` | yt-engine status | Fails if `YT_ENGINE_URL` is not set or yt-engine is unreachable |
+
+## Queue Job Endpoints
+
+| Method | Path | Purpose | Notes |
+| --- | --- | --- | --- |
+| `GET` | `/api/jobs` | List queue jobs | Filtered via query params |
+| `GET` | `/api/jobs/metrics` | Read queue metrics | BullMQ-backed |
+| `POST` | `/api/jobs` | Create generic queue job | Supports multiple job types |
+| `POST` | `/api/jobs/scrape` | Enqueue scrape job | Async |
+| `POST` | `/api/jobs/crawl` | Enqueue crawl job | Async |
+| `POST` | `/api/jobs/extract` | Enqueue extract job | Async |
+| `POST` | `/api/jobs/index` | Enqueue index job | Async |
+| `GET` | `/api/jobs/active` | Read the currently active job | Checks stream jobs first, then the queue |
+| `GET` | `/api/jobs/:id` | Read job status/result | Works for stream and queue jobs |
+| `GET` | `/api/jobs/:id/stream` | Reconnect to job progress stream | SSE |
+| `POST` | `/api/jobs/:id/cancel` | Cancel running or queued job | Uses active job manager / queue cancellation |
+
+## Legacy Compatibility Routes
+
+These routes are still mounted for backward compatibility.
+
+### `/api/v1`
+
+| Method | Path | Purpose |
+| --- | --- | --- |
+| `POST` | `/api/v1/html` | Legacy HTML scrape |
+| `POST` | `/api/v1/html-js` | Legacy JS HTML scrape |
+| `POST` | `/api/v1/content` | Legacy content extraction |
+| `POST` | `/api/v1/screenshot` | Legacy screenshot |
+| `GET` | `/api/v1/config` | Legacy config read |
+| `PATCH` | `/api/v1/config` | Legacy config update |
+| `GET` | `/api/v1/logs` | Legacy request logs |
+| `GET` | `/api/v1/api-keys` | Legacy API key list |
+| `POST` | `/api/v1/api-keys` | Legacy API key create |
+
+### `/api/v2`
+
+| Method | Path | Purpose |
+| --- | --- | --- |
+| `POST` | `/api/v2/html` | V2 HTML scrape |
+| `POST` | `/api/v2/html-js` | V2 JS HTML scrape |
+| `POST` | `/api/v2/content` | V2 content extraction |
+| `POST` | `/api/v2/screenshot` | V2 screenshot |
+| `GET` | `/api/v2/config` | V2 config read |
+| `PATCH` | `/api/v2/config` | V2 config update |
+
+## Operational Notes
+
+- The API and worker are separate processes. Queue-backed endpoints may return `503` when Redis is unavailable.
+- Configuration changes invalidate cached settings and restart the browser service.
+- Website crawl (`/api/website/crawl`) does not scrape inline; it is a queued workflow that requires Redis and the worker.
+- The web dashboard talks to this API using the internal dashboard key on server-side requests.
diff --git a/docs/setup-guide.md b/docs/setup-guide.md

Original file line number	Diff line number	Diff line change
`@@ -14,7 +14,7 @@ export function ActionButtons({ disabled = false, isPending, onRun, onStop }: Ac`
`14`	`14`	`type="button"`
`15`	`15`	`onClick={onRun}`
`16`	`16`	`disabled={disabled \|\| isPending}`
`17`		`- className="inline-flex h-12 items-center justify-center rounded-2xl bg-slate-900 px-5 text-sm font-semibold text-white transition-colors hover:bg-slate-800 disabled:cursor-not-allowed disabled:bg-slate-200 disabled:text-slate-500"`
	`17`	`+ className="inline-flex h-12 items-center justify-center rounded-2xl bg-primary px-5 text-sm font-semibold text-primary-foreground transition-colors hover:bg-primary/90 disabled:cursor-not-allowed disabled:bg-slate-200 disabled:text-slate-500"`
`18`	`18`	`>`
`19`	`19`	`Run Search`
`20`	`20`	`</button>`
Original file line number	Diff line number	Diff line change
`@@ -118,7 +118,7 @@ export function ConfigurationPanel({`
`118`	`118`	`<button`
`119`	`119`	`type="submit"`
`120`	`120`	`disabled={!query.trim() \|\| isLoading}`
`121`		`- className="inline-flex w-full items-center justify-center gap-2 rounded-2xl bg-slate-900 px-4 py-4 text-sm font-semibold text-white transition-colors hover:bg-slate-800 disabled:cursor-not-allowed disabled:opacity-60"`
	`121`	`+ className="inline-flex w-full items-center justify-center gap-2 rounded-2xl bg-primary px-4 py-4 text-sm font-semibold text-primary-foreground transition-colors hover:bg-primary/90 disabled:cursor-not-allowed disabled:opacity-60"`
`122`	`122`	`>`
`123`	`123`	`{isLoading ? (`
`124`	`124`	`<>`
Original file line number	Diff line number	Diff line change
`@@ -28,7 +28,7 @@ export function ActionButtons({`
`28`	`28`	`type="button"`
`29`	`29`	`onClick={onRun}`
`30`	`30`	`disabled={isPending \|\| !hasQuery \|\| !hasApiKey}`
`31`		`- className="inline-flex items-center justify-center gap-2 rounded-2xl bg-slate-900 px-4 py-4 text-sm font-semibold text-white transition-colors hover:bg-slate-800 disabled:cursor-not-allowed disabled:opacity-60"`
	`31`	`+ className="inline-flex items-center justify-center gap-2 rounded-2xl bg-primary px-4 py-4 text-sm font-semibold text-primary-foreground transition-colors hover:bg-primary/90 disabled:cursor-not-allowed disabled:opacity-60"`
`32`	`32`	`>`
`33`	`33`	`<HugeiconsIcon icon={ButtonIcon} className="h-4 w-4" />`
`34`	`34`	`{buttonLabel}`
Original file line number	Diff line number	Diff line change
`@@ -29,7 +29,7 @@ export function ActionButtons({`
`29`	`29`	`type="button"`
`30`	`30`	`onClick={onRun}`
`31`	`31`	`disabled={isPending \|\| !hasUrl}`
`32`		`- className="inline-flex items-center justify-center gap-2 rounded-2xl bg-slate-900 px-4 py-4 text-sm font-semibold text-white transition-colors hover:bg-slate-800 disabled:cursor-not-allowed disabled:opacity-60"`
	`32`	`+ className="inline-flex items-center justify-center gap-2 rounded-2xl bg-primary px-4 py-4 text-sm font-semibold text-primary-foreground transition-colors hover:bg-primary/90 disabled:cursor-not-allowed disabled:opacity-60"`
`33`	`33`	`>`
`34`	`34`	`<HugeiconsIcon icon={tool === 'map' ? LinkSquare01Icon : SparklesIcon} className="h-4 w-4" />`
`35`	`35`	`{buttonLabel}`