# SmartCrawler (Crawl)

Multi-page crawling with AI extraction or markdown conversion.

**Endpoint:** `POST /v1/crawl`
**Poll:** `GET /v1/crawl/{crawl_id}`
**Credits:** 10/page (AI) or 2/page (markdown)
**Docs:** https://docs.scrapegraphai.com/services/smartcrawler

## Request

| Parameter | Type | Required | Description |
|---|---|---|---|
| url | string | Yes | Starting URL |
| prompt | string | No | Extraction instructions |
| extraction_mode | boolean | No | AI extraction (`true`) or markdown conversion (`false`) |
| max_pages | number | No | Maximum number of pages to crawl |
| depth | number | No | Link depth to follow |
| schema | object | No | JSON schema for output structure |
| rules | object | No | Crawl rules (`include_paths`, `exclude_paths`, `same_domain`) |
| sitemap | boolean | No | Use the sitemap for URL discovery |
| stealth | boolean | No | Anti-bot bypass (+4 credits) |
| webhook_url | string | No | Webhook for completion notification |

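A minimal sketch of starting a crawl with the parameters above, using only the Python standard library. The `API_BASE` constant and the `SGAI-APIKEY` header name are assumptions not stated in this section; check the linked docs for the exact base URL and authentication scheme.

```python
import json
import urllib.request

API_BASE = "https://api.scrapegraphai.com/v1"  # assumed base URL

def build_crawl_payload(url, prompt=None, extraction_mode=True,
                        max_pages=10, depth=2, sitemap=False):
    """Assemble a request body from the parameters in the table above."""
    payload = {
        "url": url,
        "extraction_mode": extraction_mode,
        "max_pages": max_pages,
        "depth": depth,
        "sitemap": sitemap,
    }
    if prompt is not None:
        payload["prompt"] = prompt
    return payload

def start_crawl(payload, api_key):
    """POST the payload to /v1/crawl and return the crawl_id."""
    # The "SGAI-APIKEY" header name is an assumption; verify against the docs.
    req = urllib.request.Request(
        f"{API_BASE}/crawl",
        data=json.dumps(payload).encode("utf-8"),
        headers={"Content-Type": "application/json", "SGAI-APIKEY": api_key},
        method="POST",
    )
    with urllib.request.urlopen(req) as resp:
        return json.loads(resp.read())["crawl_id"]
```

Separating payload construction from the HTTP call keeps the request shape easy to inspect before any credits are spent.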
## Response (CompletedCrawlResponse)

| Field | Type | Description |
|---|---|---|
| crawl_id | string | Unique crawl identifier |
| status | string | `queued` \| `processing` \| `done` \| `failed` |
| result | object \| null | AI-extracted data (when `extraction_mode=true`) |
| crawled_urls | string[] | All visited URLs |
| pages | CrawlPage[] | Crawled pages with markdown content |
| error | string | Error message (empty on success) |

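Since `status` moves through `queued` and `processing` before reaching a terminal state, a client polls `GET /v1/crawl/{crawl_id}` until `done` or `failed`. A sketch of that loop, with the HTTP fetch injected as a callable so any client (and any test) can drive it:

```python
import time

TERMINAL_STATES = {"done", "failed"}

def poll_crawl(crawl_id, fetch_status, interval=5.0, timeout=300.0):
    """Poll until the crawl reaches a terminal status, then return it.

    `fetch_status` is any callable taking a crawl_id and returning the
    parsed JSON status dict from GET /v1/crawl/{crawl_id}.
    """
    deadline = time.monotonic() + timeout
    while time.monotonic() < deadline:
        status = fetch_status(crawl_id)
        if status.get("status") in TERMINAL_STATES:
            return status
        time.sleep(interval)
    raise TimeoutError(f"crawl {crawl_id} did not finish within {timeout}s")
```

If a `webhook_url` was supplied in the request, the completion notification can replace polling entirely.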
### CrawlPage

| Field | Type | Description |
|---|---|---|
| url | string | Page URL |
| markdown | string | Page content as markdown |
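In markdown mode (`extraction_mode=false`) the useful output is the `pages` array. A small helper to stitch the crawled pages into a single markdown document, assuming only the response shape described above:

```python
def pages_to_markdown(response):
    """Join each CrawlPage's markdown into one document,
    prefixing every page with its source URL as a heading."""
    parts = []
    for page in response.get("pages", []):
        parts.append(f"## {page['url']}\n\n{page['markdown']}")
    return "\n\n".join(parts)
```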