You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
.describe('Whether to enable JavaScript rendering. Enabling this may increase the time taken to retrieve the HTML skeleton.'),
33
-
page: z.number()
33
+
chunk: z.number()
34
34
.optional()
35
35
.default(1)
36
-
.describe('Page number to retrieve when paginating through content. Used to prevent exceeding the maximum tool output length.'),
36
+
.describe('Chunk number to retrieve when getting the content. The content is split into chunks to prevent exceeding the maximum tool output length.'),
37
37
});
38
38
39
39
export const getHtmlSkeleton: ToolEntry = {
40
40
type: 'internal',
41
41
tool: {
42
42
name: HelperTools.GET_HTML_SKELETON,
43
43
actorFullName: HelperTools.GET_HTML_SKELETON,
44
-
description: `Retrieves the HTML skeleton (clean structure) from a given URL by stripping unwanted elements like scripts, styles, and non-essential attributes. This tool keeps only the core HTML structure, links, images, and data attributes for analysis. Supports optional JavaScript rendering for dynamic content and provides paginated output to handle large pages. This tool is useful for building web scrapers and data extraction tasks where a clean HTML structure is needed for writing concrete selectors or parsers.`,
44
+
description: `Retrieves the HTML skeleton (clean structure) from a given URL by stripping unwanted elements like scripts, styles, and non-essential attributes. This tool keeps only the core HTML structure, links, images, and data attributes for analysis. Supports optional JavaScript rendering for dynamic content and provides chunked output to handle large HTML. This tool is useful for building web scrapers and data extraction tasks where a clean HTML structure is needed for writing concrete selectors or parsers.`,
0 commit comments