You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
* pnpm
* Scrape Page migration + prop adjustments
* Get Crawl Status migration
* Crawl migration and prop adjustments
* Version bumps and adjustments
* Typo fix
* Add example to additional options desc
* Fixing description with broken backticks
* pnpm
---------
Co-authored-by: Leo Vu <vunguyenhung@outlook.com>
description: "Crawls a given input URL and returns the contents of sub-pages. [See the documentation](https://docs.firecrawl.dev/api-reference/endpoint/crawl)",
7
-
version: "0.0.1",
7
+
description: "Crawls a given URL and returns the contents of sub-pages. [See the documentation](https://docs.firecrawl.dev/api-reference/endpoint/crawl-post)",
8
+
version: "1.0.0",
8
9
type: "action",
9
10
props: {
10
11
firecrawl,
@@ -14,180 +15,75 @@ export default {
14
15
"url",
15
16
],
16
17
},
17
-
includes: {
18
-
propDefinition: [
19
-
firecrawl,
20
-
"includes",
21
-
],
18
+
excludePaths: {
19
+
type: "string[]",
20
+
label: "Exclude Paths",
21
+
description: "URL pathname regex patterns that exclude matching URLs from the crawl. For example, a value of `blog/.*` for the URL `firecrawl.dev` will exclude any results matching that pattern, such as `https://www.firecrawl.dev/blog/firecrawl-launch-week-1-recap`",
22
22
optional: true,
23
23
},
24
-
excludes: {
25
-
propDefinition: [
26
-
firecrawl,
27
-
"excludes",
28
-
],
29
-
optional: true,
30
-
},
31
-
generateImgAltText: {
32
-
propDefinition: [
33
-
firecrawl,
34
-
"generateImgAltText",
35
-
],
36
-
optional: true,
37
-
},
38
-
returnOnlyUrls: {
39
-
propDefinition: [
40
-
firecrawl,
41
-
"returnOnlyUrls",
42
-
],
24
+
includePaths: {
25
+
type: "string[]",
26
+
label: "Include Paths",
27
+
description: "Similar to `Exclude Paths`, but if set, only the paths matching the specified patterns will be included",
43
28
optional: true,
44
29
},
45
30
maxDepth: {
46
-
propDefinition: [
47
-
firecrawl,
48
-
"maxDepth",
49
-
],
50
-
optional: true,
51
-
},
52
-
mode: {
53
-
propDefinition: [
54
-
firecrawl,
55
-
"mode",
56
-
],
31
+
type: "integer",
32
+
label: "Max Depth",
33
+
description: "Maximum depth to crawl relative to the entered URL",
57
34
optional: true,
58
35
},
59
36
ignoreSitemap: {
60
-
propDefinition: [
61
-
firecrawl,
62
-
"ignoreSitemap",
63
-
],
64
-
optional: true,
65
-
},
66
-
limit: {
67
-
propDefinition: [
68
-
firecrawl,
69
-
"limit",
70
-
],
71
-
optional: true,
72
-
},
73
-
allowBackwardCrawling: {
74
-
propDefinition: [
75
-
firecrawl,
76
-
"allowBackwardCrawling",
77
-
],
78
-
optional: true,
79
-
},
80
-
allowExternalContentLinks: {
81
-
propDefinition: [
82
-
firecrawl,
83
-
"allowExternalContentLinks",
84
-
],
37
+
type: "boolean",
38
+
label: "Ignore Sitemap",
39
+
description: "Ignore the website sitemap when crawling",
85
40
optional: true,
86
41
},
87
-
headers: {
88
-
propDefinition: [
89
-
firecrawl,
90
-
"headers",
91
-
],
42
+
ignoreQueryParameters: {
43
+
type: "boolean",
44
+
label: "Ignore Query Parameters",
45
+
description: "Do not re-scrape the same path with different (or none) query parameters",
92
46
optional: true,
93
47
},
94
-
includeHtml: {
95
-
propDefinition: [
96
-
firecrawl,
97
-
"includeHtml",
98
-
],
99
-
optional: true,
100
-
},
101
-
includeRawHtml: {
102
-
propDefinition: [
103
-
firecrawl,
104
-
"includeRawHtml",
105
-
],
106
-
optional: true,
107
-
},
108
-
onlyIncludeTags: {
109
-
propDefinition: [
110
-
firecrawl,
111
-
"onlyIncludeTags",
112
-
],
113
-
optional: true,
114
-
},
115
-
onlyMainContent: {
116
-
propDefinition: [
117
-
firecrawl,
118
-
"onlyMainContent",
119
-
],
120
-
optional: true,
121
-
},
122
-
removeTags: {
123
-
propDefinition: [
124
-
firecrawl,
125
-
"removeTags",
126
-
],
127
-
optional: true,
128
-
},
129
-
replaceAllPathsWithAbsolutePaths: {
130
-
propDefinition: [
131
-
firecrawl,
132
-
"replaceAllPathsWithAbsolutePaths",
133
-
],
48
+
limit: {
49
+
type: "integer",
50
+
label: "Limit",
51
+
description: "Maximum number of pages to crawl",
134
52
optional: true,
135
53
},
136
-
screenshot: {
137
-
propDefinition: [
138
-
firecrawl,
139
-
"screenshot",
140
-
],
54
+
allowBackwardLinks: {
55
+
type: "boolean",
56
+
label: "Allow Backward Links",
57
+
description: "Enables the crawler to navigate from a specific URL to previously linked pages",
141
58
optional: true,
142
59
},
143
-
fullPageScreenshot: {
144
-
propDefinition: [
145
-
firecrawl,
146
-
"fullPageScreenshot",
147
-
],
60
+
allowExternalLinks: {
61
+
type: "boolean",
62
+
label: "Allow External Links",
63
+
description: "Allows the crawler to follow links to external websites",
148
64
optional: true,
149
65
},
150
-
waitFor: {
66
+
additionalOptions: {
151
67
propDefinition: [
152
68
firecrawl,
153
-
"waitFor",
69
+
"additionalOptions",
154
70
],
155
-
optional: true,
71
+
description: "Additional parameters to send in the request. [See the documentation](https://docs.firecrawl.dev/api-reference/endpoint/crawl-post) for available parameters. Values will be parsed as JSON where applicable. For example, to add the `webhook` param, use the value `{\"webhook\": {\"url\": \"https://your-server-webhook-api.com\",\"headers\": {},\"metadata\": {},\"events\": [\"completed\"]}}`",
Copy file name to clipboard | Expand all lines: components/firecrawl/actions/get-crawl-status/get-crawl-status.mjs
+4 -4 Lines changed: 4 additions & 4 deletions
Original file line number
Diff line number
Diff line change
@@ -2,9 +2,9 @@ import firecrawl from "../../firecrawl.app.mjs";
2
2
3
3
export default {
4
4
key: "firecrawl-get-crawl-status",
5
-
name: "Get Crawl Status",
6
-
description: "Obtains the status and data from a previous crawl operation. [See the documentation](https://docs.firecrawl.dev/api-reference/endpoint/status)",
7
-
version: "0.0.1",
5
+
name: "Get Crawl Data",
6
+
description: "Obtains the status and data from a previous crawl operation. [See the documentation](https://docs.firecrawl.dev/api-reference/endpoint/crawl-get)",
7
+
version: "0.0.2",
8
8
type: "action",
9
9
props: {
10
10
firecrawl,
@@ -21,7 +21,7 @@ export default {
21
21
crawlId: this.crawlId,
22
22
});
23
23
24
-
$.export("$summary", `Successfully retrieved status for crawl ID: ${this.crawlId}`);
24
+
$.export("$summary", `Successfully retrieved status for crawl (ID: ${this.crawlId})`);
0 commit comments