Skip to content

Commit 8f944e3

Browse files
Merge pull request #238 from apify/feat/output-and-dataset-schema
chore: output schema
2 parents e5db3ae + 1886dd7 commit 8f944e3

4 files changed

Lines changed: 15 additions & 30 deletions

File tree

packages/actor-scraper/sitemap-scraper/.actor/actor.json

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -3,6 +3,7 @@
33
"name": "sitemap-extractor",
44
"version": "0.1",
55
"buildTag": "latest",
6+
"output": "./output_schema.json",
67
"defaultMemoryMbytes": 1024,
78
"minMemoryMbytes": 256,
89
"maxMemoryMbytes": 4096,
packages/actor-scraper/sitemap-scraper/.actor/output_schema.json

Lines changed: 13 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,13 @@
1+
{
2+
"actorOutputSchemaVersion": 1,
3+
"title": "Sitemap Extractor Output",
4+
"description": "Links to the default dataset containing extracted sitemap URLs and request metadata.",
5+
"properties": {
6+
"results": {
7+
"type": "string",
8+
"title": "Results",
9+
"description": "Dataset items with discovered URLs and crawl status.",
10+
"template": "{{links.apiDefaultDatasetUrl}}/items"
11+
}
12+
}
13+
}

packages/actor-scraper/sitemap-scraper/OUTPUT_SCHEMA.json

Lines changed: 0 additions & 29 deletions
This file was deleted.

packages/actor-scraper/sitemap-scraper/src/internals/crawler_setup.ts

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -55,7 +55,7 @@ const REQUEST_QUEUE_INIT_FLAG_KEY = 'REQUEST_QUEUE_INITIALIZED';
5555
* instance and creating a context for a pageFunction invocation.
5656
*/
5757
export class CrawlerSetup {
58-
name = 'Sitemap Scraper';
58+
name = 'Sitemap Extractor';
5959
rawInput: string;
6060
env: ApifyEnv;
6161
/**

0 commit comments

Comments
 (0)