docs: Add Parsel and Crawlee Parsel guides #577
Merged
Commits
cee1d9c reorder of sections (vdusek)
eaef0aa add crawlee parsel (vdusek)
f3e3473 add parsel impit (vdusek)
d8e3b51 fix scrapy integration test path (vdusek)
4342563 rm unnecessary future import (vdusek)
704b76d address the feedback (vdusek)
File renamed without changes.
This file was deleted.
This file was deleted.
@@ -0,0 +1,30 @@
---
id: beautifulsoup-httpx
title: Using BeautifulSoup with HTTPX
---

import CodeBlock from '@theme/CodeBlock';

import BeautifulSoupHttpxExample from '!!raw-loader!./code/01_beautifulsoup_httpx.py';

In this guide, you'll learn how to use the [BeautifulSoup](https://www.crummy.com/software/BeautifulSoup/) library with the [HTTPX](https://www.python-httpx.org/) library in your Apify Actors.

## Introduction

[BeautifulSoup](https://www.crummy.com/software/BeautifulSoup/) is a Python library for extracting data from HTML and XML files. It provides simple methods and Pythonic idioms for navigating, searching, and modifying a website's element tree, enabling efficient data extraction.
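
For a quick feel for the API, here is a minimal, self-contained example (the HTML string is made up for illustration):

```python
from bs4 import BeautifulSoup

# A made-up HTML snippet, just to illustrate the API.
html = '<html><body><h1>Hello</h1><a href="/about">About</a></body></html>'
soup = BeautifulSoup(html, 'html.parser')

print(soup.h1.text)    # Hello
print(soup.a['href'])  # /about
```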

[HTTPX](https://www.python-httpx.org/) is a modern, high-level HTTP client library for Python. It provides a simple interface for making HTTP requests and supports both synchronous and asynchronous requests.
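
A minimal sketch of an asynchronous request with HTTPX might look like this:

```python
import asyncio

import httpx


async def main() -> None:
    async with httpx.AsyncClient() as client:
        response = await client.get('https://apify.com')
        print(response.status_code, len(response.text))


asyncio.run(main())
```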

To create an Actor which uses those libraries, start from the [BeautifulSoup & Python](https://apify.com/templates/categories/python) Actor template. This template includes the [BeautifulSoup](https://www.crummy.com/software/BeautifulSoup/) and [HTTPX](https://www.python-httpx.org/) libraries preinstalled, allowing you to begin development immediately.

## Example Actor

Below is a simple Actor that recursively scrapes titles from all linked websites, up to a specified maximum depth, starting from URLs provided in the Actor input. It uses [HTTPX](https://www.python-httpx.org/) for fetching pages and [BeautifulSoup](https://www.crummy.com/software/BeautifulSoup/) for parsing their content to extract titles and links to other pages.

<CodeBlock className="language-python">
    {BeautifulSoupHttpxExample}
</CodeBlock>

## Conclusion

In this guide, you learned how to use [BeautifulSoup](https://www.crummy.com/software/BeautifulSoup/) with [HTTPX](https://www.python-httpx.org/) in your Apify Actors. By combining these libraries, you can efficiently extract data from HTML or XML files, making it easy to build web scraping tasks in Python. See the [Actor templates](https://apify.com/templates/categories/python) to get started with your own scraping tasks. If you have questions or need assistance, feel free to reach out on our [GitHub](https://github.com/apify/apify-sdk-python) or join our [Discord community](https://discord.com/invite/jyEM2PRvMU). Happy scraping!
@@ -0,0 +1,28 @@
---
id: parsel-impit
title: Using Parsel with Impit
---

import CodeBlock from '@theme/CodeBlock';

import ParselImpitExample from '!!raw-loader!./code/02_parsel_impit.py';

In this guide, you'll learn how to combine the [Parsel](https://github.com/scrapy/parsel) and [Impit](https://github.com/apify/impit) libraries when building Apify Actors.

## Introduction

[Parsel](https://github.com/scrapy/parsel) is a Python library for extracting data from HTML and XML documents using CSS selectors and [XPath](https://en.wikipedia.org/wiki/XPath) expressions. It offers an intuitive API for navigating and extracting structured data, making it a popular choice for web scraping. Compared to [BeautifulSoup](https://www.crummy.com/software/BeautifulSoup/), it also delivers better performance.
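
For instance (the HTML string is made up for illustration):

```python
import parsel

# A made-up HTML snippet, just to illustrate the API.
html = '<html><body><h1>Hello</h1><a href="/about">About</a></body></html>'
selector = parsel.Selector(text=html)

print(selector.css('h1::text').get())     # Hello
print(selector.xpath('//a/@href').get())  # /about
```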

[Impit](https://github.com/apify/impit) is Apify's high-performance HTTP client for Python. It supports both synchronous and asynchronous workflows and is built for large-scale web scraping, where making thousands of requests efficiently is essential. With built-in browser impersonation and anti-blocking features, it simplifies handling modern websites.
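
A minimal asynchronous request could look like the sketch below; the `browser` argument for impersonation is an assumption based on Impit's documentation, so check the current API for supported values:

```python
import asyncio

import impit


async def main() -> None:
    # `browser='chrome'` enables browser impersonation (assumed parameter;
    # see Impit's docs for the currently supported values).
    async with impit.AsyncClient(browser='chrome') as client:
        response = await client.get('https://apify.com')
        print(response.status_code)


asyncio.run(main())
```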

## Example Actor

The following example shows a simple Actor that recursively scrapes titles from linked pages, up to a user-defined maximum depth. It uses [Impit](https://github.com/apify/impit) to fetch pages and [Parsel](https://github.com/scrapy/parsel) to extract titles and discover new links.

<CodeBlock className="language-python">
    {ParselImpitExample}
</CodeBlock>

## Conclusion

In this guide, you learned how to use [Parsel](https://github.com/scrapy/parsel) with [Impit](https://github.com/apify/impit) in your Apify Actors. By combining these libraries, you get a powerful and efficient solution for web scraping: [Parsel](https://github.com/scrapy/parsel) provides excellent CSS selector and XPath support for data extraction, while [Impit](https://github.com/apify/impit) offers a fast and simple HTTP client built by Apify. This combination makes it easy to build scalable web scraping tasks in Python. See the [Actor templates](https://apify.com/templates/categories/python) to get started with your own scraping tasks. If you have questions or need assistance, feel free to reach out on our [GitHub](https://github.com/apify/apify-sdk-python) or join our [Discord community](https://discord.com/invite/jyEM2PRvMU). Happy scraping!
File renamed without changes.
File renamed without changes.
@@ -0,0 +1,46 @@
---
id: crawlee
title: Using Crawlee
---

import CodeBlock from '@theme/CodeBlock';

import CrawleeBeautifulSoupExample from '!!raw-loader!./code/05_crawlee_beautifulsoup.py';
import CrawleeParselExample from '!!raw-loader!./code/05_crawlee_parsel.py';
import CrawleePlaywrightExample from '!!raw-loader!./code/05_crawlee_playwright.py';

In this guide, you'll learn how to use the [Crawlee](https://crawlee.dev/python) library in your Apify Actors.

## Introduction

[Crawlee](https://crawlee.dev/python) is a Python library for web scraping and browser automation that provides a robust and flexible framework for building web scraping tasks. It seamlessly integrates with the Apify platform and supports a variety of scraping techniques, from static HTML parsing to handling dynamic JavaScript-rendered content. Crawlee offers a range of crawlers, including HTTP-based crawlers like [`HttpCrawler`](https://crawlee.dev/python/api/class/HttpCrawler), [`BeautifulSoupCrawler`](https://crawlee.dev/python/api/class/BeautifulSoupCrawler), and [`ParselCrawler`](https://crawlee.dev/python/api/class/ParselCrawler), and browser-based crawlers like [`PlaywrightCrawler`](https://crawlee.dev/python/api/class/PlaywrightCrawler), to suit different scraping needs.

In this guide, you'll learn how to use Crawlee with [`BeautifulSoupCrawler`](https://crawlee.dev/python/api/class/BeautifulSoupCrawler), [`ParselCrawler`](https://crawlee.dev/python/api/class/ParselCrawler), and [`PlaywrightCrawler`](https://crawlee.dev/python/api/class/PlaywrightCrawler) to build Apify Actors for web scraping.
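
All three crawlers share the same basic shape: you instantiate a crawler, register a default request handler on its router, and run it with a list of start URLs. Here is a minimal sketch using [`ParselCrawler`](https://crawlee.dev/python/api/class/ParselCrawler) outside the Actor context; note that exact import paths may differ between Crawlee versions:

```python
import asyncio

from crawlee.crawlers import ParselCrawler, ParselCrawlingContext


async def main() -> None:
    crawler = ParselCrawler(max_requests_per_crawl=10)

    # The default handler is called for every request the crawler processes.
    @crawler.router.default_handler
    async def handler(context: ParselCrawlingContext) -> None:
        # ParselCrawler exposes the parsed page as `context.selector`.
        title = context.selector.css('title::text').get()
        await context.push_data({'url': context.request.url, 'title': title})

    await crawler.run(['https://crawlee.dev'])


asyncio.run(main())
```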

## Actor with BeautifulSoupCrawler

The [`BeautifulSoupCrawler`](https://crawlee.dev/python/api/class/BeautifulSoupCrawler) is ideal for extracting data from static HTML pages. It uses [BeautifulSoup](https://www.crummy.com/software/BeautifulSoup/bs4/doc/) for parsing and [`ImpitHttpClient`](https://crawlee.dev/python/api/class/ImpitHttpClient) for HTTP communication, ensuring efficient and lightweight scraping. If you do not need to execute JavaScript on the page, [`BeautifulSoupCrawler`](https://crawlee.dev/python/api/class/BeautifulSoupCrawler) is a great choice for your scraping tasks. Below is an example of how to use it in an Apify Actor.

<CodeBlock className="language-python">
    {CrawleeBeautifulSoupExample}
</CodeBlock>

## Actor with ParselCrawler

The [`ParselCrawler`](https://crawlee.dev/python/api/class/ParselCrawler) works in the same way as [`BeautifulSoupCrawler`](https://crawlee.dev/python/api/class/BeautifulSoupCrawler), but it uses the [Parsel](https://parsel.readthedocs.io/en/latest/) library for HTML parsing. This allows more powerful and flexible data extraction using [XPath](https://en.wikipedia.org/wiki/XPath) expressions in addition to CSS selectors, and it is generally faster than [`BeautifulSoupCrawler`](https://crawlee.dev/python/api/class/BeautifulSoupCrawler). Below is an example of how to use [`ParselCrawler`](https://crawlee.dev/python/api/class/ParselCrawler) in an Apify Actor.

<CodeBlock className="language-python">
    {CrawleeParselExample}
</CodeBlock>

## Actor with PlaywrightCrawler

The [`PlaywrightCrawler`](https://crawlee.dev/python/api/class/PlaywrightCrawler) is built for handling dynamic web pages that rely on JavaScript for content generation. Using the [Playwright](https://playwright.dev/) library, it provides a browser-based automation environment to interact with complex websites. Below is an example of how to use [`PlaywrightCrawler`](https://crawlee.dev/python/api/class/PlaywrightCrawler) in an Apify Actor.

<CodeBlock className="language-python">
    {CrawleePlaywrightExample}
</CodeBlock>

## Conclusion

In this guide, you learned how to use the [Crawlee](https://crawlee.dev/python) library in your Apify Actors. By using the [`BeautifulSoupCrawler`](https://crawlee.dev/python/api/class/BeautifulSoupCrawler), [`ParselCrawler`](https://crawlee.dev/python/api/class/ParselCrawler), and [`PlaywrightCrawler`](https://crawlee.dev/python/api/class/PlaywrightCrawler) crawlers, you can efficiently scrape static or dynamic web pages, making it easy to build web scraping tasks in Python. See the [Actor templates](https://apify.com/templates/categories/python) to get started with your own scraping tasks. If you have questions or need assistance, feel free to reach out on our [GitHub](https://github.com/apify/apify-sdk-python) or join our [Discord community](https://discord.com/invite/jyEM2PRvMU). Happy scraping!
File renamed without changes.
@@ -0,0 +1,89 @@
from urllib.parse import urljoin

import impit
import parsel

from apify import Actor, Request


async def main() -> None:
    # Enter the context of the Actor.
    async with Actor:
        # Retrieve the Actor input, and use default values if not provided.
        actor_input = await Actor.get_input() or {}
        start_urls = actor_input.get('start_urls', [{'url': 'https://apify.com'}])
        max_depth = actor_input.get('max_depth', 1)

        # Exit if no start URLs are provided.
        if not start_urls:
            Actor.log.info('No start URLs specified in Actor input, exiting...')
            await Actor.exit()

        # Open the default request queue for handling URLs to be processed.
        request_queue = await Actor.open_request_queue()

        # Enqueue the start URLs with an initial crawl depth of 0.
        for start_url in start_urls:
            url = start_url.get('url')
            Actor.log.info(f'Enqueuing {url} ...')
            new_request = Request.from_url(url, user_data={'depth': 0})
            await request_queue.add_request(new_request)

        # Create an Impit client to fetch the HTML content of the URLs.
        async with impit.AsyncClient() as client:
            # Process the URLs from the request queue.
            while request := await request_queue.fetch_next_request():
                url = request.url

                if not isinstance(request.user_data['depth'], (str, int)):
                    raise TypeError('Request.depth is an unexpected type.')

                depth = int(request.user_data['depth'])
                Actor.log.info(f'Scraping {url} (depth={depth}) ...')

                try:
                    # Fetch the HTTP response from the specified URL using Impit.
                    response = await client.get(url)

                    # Parse the HTML content using Parsel Selector.
                    selector = parsel.Selector(text=response.text)

                    # If the current depth is less than max_depth, find nested links
                    # and enqueue them.
                    if depth < max_depth:
                        # Extract all links using a CSS selector.
                        links = selector.css('a::attr(href)').getall()
                        for link_href in links:
                            link_url = urljoin(url, link_href)

                            if link_url.startswith(('http://', 'https://')):
                                Actor.log.info(f'Enqueuing {link_url} ...')
                                new_request = Request.from_url(
                                    link_url,
                                    user_data={'depth': depth + 1},
                                )
                                await request_queue.add_request(new_request)

                    # Extract the desired data using Parsel selectors.
                    title = selector.css('title::text').get()
                    h1s = selector.css('h1::text').getall()
                    h2s = selector.css('h2::text').getall()
                    h3s = selector.css('h3::text').getall()

                    data = {
                        'url': url,
                        'title': title,
                        'h1s': h1s,
                        'h2s': h2s,
                        'h3s': h3s,
                    }

                    # Store the extracted data to the default dataset.
                    await Actor.push_data(data)

                except Exception:
                    Actor.log.exception(f'Cannot extract data from {url}.')

                finally:
                    # Mark the request as handled to ensure it is not processed again.
                    await request_queue.mark_request_as_handled(request)
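
For context, the `main()` coroutine above is typically launched from the Actor's entry point; in the Apify Python templates that is a small `__main__.py` roughly like the following (the exact file layout is an assumption based on the templates):

```python
# src/__main__.py (assumed layout, following the Apify Python templates)
import asyncio

from .main import main

asyncio.run(main())
```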
2 changes: 0 additions & 2 deletions
docs/02_guides/code/03_playwright.py → docs/03_guides/code/03_playwright.py
2 changes: 0 additions & 2 deletions
docs/02_guides/code/04_selenium.py → docs/03_guides/code/04_selenium.py
@@ -1,5 +1,3 @@
-from __future__ import annotations
-
 import asyncio
 from urllib.parse import urljoin
2 changes: 0 additions & 2 deletions
...2_guides/code/02_crawlee_beautifulsoup.py → ...3_guides/code/05_crawlee_beautifulsoup.py