brightdata
diff --git a/README.md b/README.md
Lines changed: 56 additions & 0 deletions
diff --git a/package.json b/package.json
Lines changed: 1 addition & 1 deletion
diff --git a/src/__tests__/commands/discover.test.ts b/src/__tests__/commands/discover.test.ts
Lines changed: 260 additions & 0 deletions
@@ -24,6 +24,7 @@
 |---|---|
 | `brightdata scrape` | Scrape any URL — bypasses CAPTCHAs, JS rendering, anti-bot protections |
 | `brightdata search` | Google / Bing / Yandex search with structured JSON output |
+| `brightdata discover` | AI-powered web discovery — find and rank results by intent, with optional full-page content |
 | `brightdata pipelines` | Extract structured data from 40+ platforms (Amazon, LinkedIn, TikTok…) |
 | `brightdata browser` | Control a real browser via Bright Data's Scraping Browser — navigate, snapshot, click, type, and more |
 | `brightdata zones` | List and inspect your Bright Data proxy zones |
@@ -44,6 +45,7 @@
   - [init](#init)
   - [scrape](#scrape)
   - [search](#search)
+  - [discover](#discover)
   - [pipelines](#pipelines)
   - [browser](#browser)
   - [status](#status)
@@ -246,6 +248,60 @@ brightdata search "bright data pricing" --engine bing
 
 ---
 
+### `discover`
+
+AI-powered web discovery. Submit a query with an optional intent, and Bright Data finds and ranks matching results, optionally extracting full-page content for each one.
+
+```bash
+brightdata discover <query> [options]
+```
+
+| Flag | Description |
+|---|---|
+| `--intent <text>` | AI intent to evaluate and rank result relevance |
+| `--country <code>` | ISO country code (default: `US`) |
+| `--city <name>` | City for localized results (e.g. `"New York"`) |
+| `--language <code>` | Language code (default: `en`) |
+| `--num-results <n>` | Number of results to return |
+| `--filter-keywords <words>` | Comma-separated keywords that must appear in results |
+| `--include-content` | Include full page content in each result |
+| `--no-remove-duplicates` | Keep duplicate results |
+| `--start-date <date>` | Only include content updated from this date onward (`YYYY-MM-DD`) |
+| `--end-date <date>` | Only include content updated up to this date (`YYYY-MM-DD`) |
+| `--timeout <seconds>` | Polling timeout in seconds (default: `600`) |
+| `-o, --output <path>` | Write output to file |
+| `--json` / `--pretty` | JSON output (raw / indented) |
+| `-k, --api-key <key>` | Override API key |
+
+**Examples**
+
+```bash
+# Basic discovery — table output
+brightdata discover "AI trends"
+
+# With AI intent for relevance ranking
+brightdata discover "AI trends" \
+  --intent "Prioritize institutional reports for VC research"
+
+# Include full page content as markdown
+brightdata discover "AI trends" --include-content --num-results 5
+
+# Geo-targeted with date range
+brightdata discover "best restaurants" --country US --city "New York" \
+  --start-date 2025-01-01 --end-date 2025-12-31
+
+# Filter results by keywords
+brightdata discover "generative AI SaaS" --filter-keywords "revenue,SaaS"
+
+# JSON output to file
+brightdata discover "AI trends" --num-results 10 --pretty -o results.json
+
+# Pipe-friendly — JSON is emitted automatically when stdout is redirected
+brightdata discover "AI trends" --include-content --num-results 3 > results.json
+```
+
+---
+
 ### `pipelines`
 
 Extract structured data from 40+ platforms using Bright Data's Web Scraper API. Triggers an async collection job, polls until ready, and returns results.
 
@@ -1,6 +1,6 @@
 {
     "name": "@brightdata/cli",
-    "version": "0.1.6",
+    "version": "0.1.7",
     "description": "Command-line interface for Bright Data. Scrape, search, extract structured data, and automate browsers directly from your terminal.",
     "main": "dist/index.js",
     "bin": {
 
@@ -0,0 +1,260 @@
+import {describe, it, expect, beforeEach, vi} from 'vitest';
+
+const mocks = vi.hoisted(()=>({ // shared stubs, created via vi.hoisted so the vi.mock factories below can reference them
+    post: vi.fn(),
+    get: vi.fn(),
+    ensure_authenticated: vi.fn(),
+    stop: vi.fn(), // handed back by start() in beforeEach as the spinner's stop
+    start: vi.fn(),
+    print: vi.fn(),
+    print_table: vi.fn(),
+    fail: vi.fn((msg: string)=>{ throw new Error(`fail:${msg}`); }), // throws instead of returning; message is prefixed with "fail:"
+    dim: vi.fn((msg: string)=>msg), // identity: returns the message unchanged
+    parse_timeout: vi.fn(),
+    poll_until: vi.fn(),
+}));
+
+vi.mock('../../utils/client', ()=>({
+    post: mocks.post,
+    get: mocks.get,
+}));
+
+vi.mock('../../utils/auth', ()=>({
+    ensure_authenticated: mocks.ensure_authenticated,
+}));
+
+vi.mock('../../utils/spinner', ()=>({
+    start: mocks.start,
+}));
+
+vi.mock('../../utils/output', ()=>({
+    print: mocks.print,
+    print_table: mocks.print_table,
+    fail: mocks.fail,
+    dim: mocks.dim,
+}));
+
+vi.mock('../../utils/polling', ()=>({
+    parse_timeout: mocks.parse_timeout,
+    poll_until: mocks.poll_until,
+}));
+
+import {
+    handle_discover,
+    build_request,
+    extract_status,
+    format_markdown,
+    print_discover_table,
+} from '../../commands/discover';
+
+describe('commands/discover', ()=>{
+    beforeEach(()=>{
+        vi.clearAllMocks();
+        mocks.ensure_authenticated.mockReturnValue('api_key');
+        mocks.parse_timeout.mockReturnValue(600);
+        mocks.start.mockReturnValue({stop: mocks.stop});
+    });
+
+    describe('build_request', ()=>{
+        it('builds minimal request with only query', ()=>{
+            const req = build_request('AI trends', {});
+            expect(req).toEqual({query: 'AI trends'});
+        });
+
+        it('includes all optional params', ()=>{
+            const req = build_request('AI trends', {
+                intent: 'find research papers',
+                city: 'New York',
+                country: 'US',
+                language: 'en',
+                numResults: '10',
+                filterKeywords: 'AI, machine learning',
+                includeContent: true,
+                startDate: '2025-01-01',
+                endDate: '2025-12-31',
+            });
+            expect(req).toEqual({
+                query: 'AI trends',
+                intent: 'find research papers',
+                city: 'New York',
+                country: 'US',
+                language: 'en',
+                num_results: 10,
+                filter_keywords: ['AI', 'machine learning'],
+                include_content: true,
+                start_date: '2025-01-01',
+                end_date: '2025-12-31',
+            });
+        });
+
+        it('parses comma-separated filter keywords with whitespace', ()=>{
+            const req = build_request('q', {filterKeywords: ' a , b , c '});
+            expect(req.filter_keywords).toEqual(['a', 'b', 'c']);
+        });
+
+        it('does not set format by default (API returns JSON)', ()=>{
+            const req = build_request('test', {});
+            expect(req.format).toBeUndefined();
+        });
+
+        it('does not set format when include-content is used', ()=>{
+            const req = build_request('test', {includeContent: true});
+            expect(req.format).toBeUndefined();
+            expect(req.include_content).toBe(true);
+        });
+    });
+
+    describe('extract_status', ()=>{
+        it('returns status from valid response', ()=>{
+            expect(extract_status({status: 'processing'})).toBe('processing');
+            expect(extract_status({status: 'done'})).toBe('done');
+        });
+
+        it('returns undefined for invalid input', ()=>{
+            expect(extract_status(null as never)).toBeUndefined();
+            expect(extract_status(undefined as never)).toBeUndefined();
+        });
+    });
+
+    describe('format_markdown', ()=>{
+        it('formats results as markdown', ()=>{
+            const md = format_markdown([
+                {
+                    link: 'https://example.com',
+                    title: 'Example',
+                    description: 'A description',
+                    relevance_score: 0.95,
+                },
+            ], 'test query');
+            expect(md).toContain('# Discover results for "test query"');
+            expect(md).toContain('**1. [Example](https://example.com)** (95.0%)');
+            expect(md).toContain('A description');
+        });
+
+        it('includes content when present', ()=>{
+            const md = format_markdown([
+                {
+                    link: 'https://example.com',
+                    title: 'Example',
+                    description: 'Desc',
+                    relevance_score: 0.5,
+                    content: '# Page content here',
+                },
+            ], 'q');
+            expect(md).toContain('# Page content here');
+        });
+    });
+
+    describe('print_discover_table', ()=>{
+        it('calls print_table with formatted rows', ()=>{
+            const results = [
+                {
+                    link: 'https://example.com',
+                    title: 'Example Title',
+                    description: 'Desc',
+                    relevance_score: 0.98184747,
+                },
+            ];
+            print_discover_table(results);
+            expect(mocks.print_table).toHaveBeenCalledWith(
+                [{
+                    '#': '1',
+                    title: 'Example Title',
+                    score: '98.2%',
+                    url: 'https://example.com',
+                }],
+                ['#', 'title', 'score', 'url']
+            );
+        });
+
+        it('prints dim message when no results', ()=>{
+            // Stub console.log: with an empty result list the message is
+            // expected on console.log and print_table must stay untouched.
+            const log = vi.spyOn(console, 'log').mockImplementation(()=>{});
+            try {
+                print_discover_table([]);
+                expect(log).toHaveBeenCalled();
+                expect(mocks.print_table).not.toHaveBeenCalled();
+            } finally {
+                // Restore even when an assertion throws, so the stubbed
+                // console.log cannot leak into later tests.
+                log.mockRestore();
+            }
+        });
+    });
+
+    describe('handle_discover', ()=>{
+        it('triggers and polls then prints table', async()=>{
+            mocks.post.mockResolvedValue({status: 'ok', task_id: 'abc123'});
+            mocks.poll_until.mockResolvedValue({
+                result: {
+                    status: 'done',
+                    duration_seconds: 5,
+                    results: [
+                        {
+                            link: 'https://example.com',
+                            title: 'Result',
+                            description: 'Desc',
+                            relevance_score: 0.9,
+                        },
+                    ],
+                },
+                attempts: 3,
+            });
+            await handle_discover('AI trends', {});
+            expect(mocks.post).toHaveBeenCalledWith(
+                'api_key',
+                '/discover',
+                {query: 'AI trends'},
+                {timing: undefined}
+            );
+            expect(mocks.poll_until).toHaveBeenCalledTimes(1);
+            expect(mocks.print_table).toHaveBeenCalledTimes(1);
+        });
+
+        it('prints json when --json is set', async()=>{
+            const response = {
+                status: 'done',
+                duration_seconds: 2,
+                results: [{
+                    link: 'https://example.com',
+                    title: 'R',
+                    description: 'D',
+                    relevance_score: 0.8,
+                }],
+            };
+            mocks.post.mockResolvedValue({status: 'ok', task_id: 't1'});
+            mocks.poll_until.mockResolvedValue({result: response, attempts: 1});
+            await handle_discover('q', {json: true});
+            expect(mocks.print).toHaveBeenCalledWith(
+                response,
+                {json: true, pretty: undefined, output: undefined}
+            );
+            expect(mocks.print_table).not.toHaveBeenCalled();
+        });
+
+        it('prints raw JSON when --output is set', async()=>{
+            const response = {
+                status: 'done',
+                results: [{
+                    link: 'https://example.com',
+                    title: 'R',
+                    description: 'D',
+                    relevance_score: 0.7,
+                }],
+            };
+            mocks.post.mockResolvedValue({status: 'ok', task_id: 't2'});
+            mocks.poll_until.mockResolvedValue({result: response, attempts: 1});
+            await handle_discover('q', {output: 'out.json'});
+            expect(mocks.print).toHaveBeenCalledWith(
+                response,
+                {json: undefined, pretty: undefined, output: 'out.json'}
+            );
+        });
+
+        it('fails when trigger returns no task_id', async()=>{
+            // The trigger response carries no task_id, so the command is
+            // expected to report the problem through fail().
+            mocks.post.mockResolvedValue({status: 'ok'});
+            // Stub process.exit and console.error so the failure path can
+            // neither terminate the test runner nor print to its output.
+            const exit = vi.spyOn(process, 'exit')
+                .mockImplementation(()=>undefined as never);
+            const error = vi.spyOn(console, 'error')
+                .mockImplementation(()=>{});
+            try {
+                await handle_discover('q', {});
+                expect(mocks.fail).toHaveBeenCalled();
+            } finally {
+                // Restore even if handle_discover rejects or the assertion
+                // fails, so the stubs cannot leak into later tests.
+                exit.mockRestore();
+                error.mockRestore();
+            }
+        });
+    });
+});
Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,6 @@`
`1`	`1`	`{`
`2`	`2`	`"name": "@brightdata/cli",`
`3`		`- "version": "0.1.6",`
	`3`	`+ "version": "0.1.7",`
`4`	`4`	`"description": "Command-line interface for Bright Data. Scrape, search, extract structured data, and automate browsers directly from your terminal.",`
`5`	`5`	`"main": "dist/index.js",`
`6`	`6`	`"bin": {`