apify · vdusek · Oct 29, 2025 · Oct 24, 2025 · Oct 24, 2025 · Oct 29, 2025
diff --git a/pyproject.toml b/pyproject.toml
@@ -36,7 +36,7 @@ keywords = [
 dependencies = [
     "apify-client>=2.2.0,<3.0.0",
     "apify-shared>=2.0.0,<3.0.0",
-    "crawlee>=1.0.2,<2.0.0",
+    "crawlee>=1.0.4,<2.0.0",
     "cachetools>=5.5.0",
     "cryptography>=42.0.0",
     "impit>=0.6.1",

diff --git a/tests/integration/README.md b/tests/integration/README.md
@@ -1,14 +1,25 @@
 # Integration tests
 
-We have integration tests which build and run Actors using the Python SDK on the Apify Platform. To run these tests, you need to set the `APIFY_TEST_USER_API_TOKEN` environment variable to the API token of the Apify user you want to use for the tests, and then start them with `make integration-tests`.
+There are two different groups of integration tests in this repository:
+- Apify API integration tests. These test that the Apify SDK is correctly communicating with Apify API through Apify client.
+- Actor integration tests. These test that the Apify SDK can be used in Actors deployed to Apify platform. These are very high level tests, and they test communication with the API and correct interaction with the Apify platform.
 
-If you want to run the integration tests on a different environment than the main Apify Platform, you need to set the `APIFY_INTEGRATION_TESTS_API_URL` environment variable to the right URL to the Apify API you want to use.
+To run these tests, you need to set the `APIFY_TEST_USER_API_TOKEN` environment variable to the API token of the Apify user you want to use for the tests, and then start them with `make integration-tests`.
 
-## How to write tests
+## Apify API integration tests
+The tests are making real requests to the Apify API as opposed to the unit tests that are mocking such API calls. On the other hand they are faster than `Actor integration tests` as they do not require building and deploying the Actor. These test can be also fully debugged locally. Preferably try to write integration tests on this level if possible.
+
+
+## Actor integration tests
+We have integration tests which build and run Actors using the Python SDK on the Apify platform. These integration tests are slower than `Apify API integration tests` as they need to build and deploy Actors on the platform. Preferably try to write `Apify API integration tests` first, and only write `Actor integration tests` when you need to test something that can only be tested on the platform.
+
+If you want to run the integration tests on a different environment than the main Apify platform, you need to set the `APIFY_INTEGRATION_TESTS_API_URL` environment variable to the right URL to the Apify API you want to use.
+
+### How to write tests
 
 There are two fixtures which you can use to write tests:
 
-### `apify_client_async`
+#### `apify_client_async`
 
 This fixture just gives you an instance of `ApifyClientAsync` configured with the right token and API URL, so you don't have to do that yourself.
 
@@ -17,15 +28,15 @@ async def test_something(apify_client_async: ApifyClientAsync) -> None:
     assert await apify_client_async.user('me').get() is not None
 ```
 
-### `make_actor`
+#### `make_actor`
 
-This fixture returns a factory function for creating Actors on the Apify Platform.
+This fixture returns a factory function for creating Actors on the Apify platform.
 
 For the Actor source, the fixture takes the files from `tests/integration/actor_source_base`, builds the Apify SDK wheel from the current codebase, and adds the Actor source you passed to the fixture as an argument. You have to pass exactly one of the `main_func`, `main_py` and `source_files` arguments.
 
 The created Actor will be uploaded to the platform, built there, and after the test finishes, it will be automatically deleted. If the Actor build fails, it will not be deleted, so that you can check why the build failed.
 
-### Creating test Actor straight from a Python function
+#### Creating test Actor straight from a Python function
 
 You can create Actors straight from a Python function. This is great because you can have the test Actor source code checked with the linter.
 
@@ -66,7 +77,7 @@ async def test_something(
     assert run_result.status == 'SUCCEEDED'
 ```
 
-### Creating Actor from source files
+#### Creating Actor from source files
 
 You can also pass the source files directly if you need something more complex (e.g. pass some fixed value to the Actor source code or use multiple source files).
 
@@ -127,7 +138,7 @@ async def test_something(
     assert actor_run.status == 'SUCCEEDED'
 ```
 
-### Asserts
+#### Asserts
 
 Since test Actors are not executed as standard pytest tests, we don't get introspection of assertion expressions. In case of failure, only a bare `AssertionError` is shown, without the left and right values. This means, we must include explicit assertion messages to aid potential debugging.
 

diff --git a/...gration/actor_source_base/src/__init__.py → tests/integration/actor/__init__.py b/...gration/actor_source_base/src/__init__.py → tests/integration/actor/__init__.py
diff --git a/.../integration/actor_source_base/Dockerfile → ...ration/actor/actor_source_base/Dockerfile b/.../integration/actor_source_base/Dockerfile → ...ration/actor/actor_source_base/Dockerfile
diff --git a/...ration/actor_source_base/requirements.txt → .../actor/actor_source_base/requirements.txt b/...ration/actor_source_base/requirements.txt → .../actor/actor_source_base/requirements.txt
diff --git a/...s/integration/actor_source_base/server.py → ...gration/actor/actor_source_base/server.py b/...s/integration/actor_source_base/server.py → ...gration/actor/actor_source_base/server.py
diff --git a/tests/integration/actor/actor_source_base/src/__init__.py b/tests/integration/actor/actor_source_base/src/__init__.py
diff --git a/...gration/actor_source_base/src/__main__.py → ...n/actor/actor_source_base/src/__main__.py b/...gration/actor_source_base/src/__main__.py → ...n/actor/actor_source_base/src/__main__.py
diff --git a/...integration/actor_source_base/src/main.py → ...ation/actor/actor_source_base/src/main.py b/...integration/actor_source_base/src/main.py → ...ation/actor/actor_source_base/src/main.py
diff --git a/tests/integration/actor/conftest.py b/tests/integration/actor/conftest.py
@@ -0,0 +1,322 @@
+from __future__ import annotations
+
+import base64
+import inspect
+import os
+import subprocess
+import sys
+import textwrap
+from pathlib import Path
+from typing import TYPE_CHECKING, Any, Protocol
+
+import pytest
+from filelock import FileLock
+
+from apify_client import ApifyClient, ApifyClientAsync
+from apify_shared.consts import ActorJobStatus, ActorSourceType
+
+from .._utils import generate_unique_resource_name
+from apify._models import ActorRun
+
+if TYPE_CHECKING:
+    from collections.abc import Awaitable, Callable, Coroutine, Iterator, Mapping
+    from decimal import Decimal
+
+    from apify_client.clients.resource_clients import ActorClientAsync
+
+_TOKEN_ENV_VAR = 'APIFY_TEST_USER_API_TOKEN'
+_API_URL_ENV_VAR = 'APIFY_INTEGRATION_TESTS_API_URL'
+_SDK_ROOT_PATH = Path(__file__).parent.parent.parent.parent.resolve()
+
+
+@pytest.fixture(scope='session')
+def sdk_wheel_path(tmp_path_factory: pytest.TempPathFactory, testrun_uid: str) -> Path:
+    """Build the package wheel if it hasn't been built yet, and return the path to the wheel."""
+    # Make sure the wheel is not being built concurrently across all the pytest-xdist runners,
+    # through locking the building process with a temp file.
+    with FileLock(tmp_path_factory.getbasetemp().parent / 'sdk_wheel_build.lock'):
+        # Make sure the wheel is built exactly once across across all the pytest-xdist runners,
+        # through an indicator file saying that the wheel was already built.
+        was_wheel_built_this_test_run_file = tmp_path_factory.getbasetemp() / f'wheel_was_built_in_run_{testrun_uid}'
+        if not was_wheel_built_this_test_run_file.exists():
+            subprocess.run(
+                args='python -m build',
+                cwd=_SDK_ROOT_PATH,
+                shell=True,
+                check=True,
+                capture_output=True,
+            )
+            was_wheel_built_this_test_run_file.touch()
+
+        # Read the current package version, necessary for getting the right wheel filename.
+        pyproject_toml_file = (_SDK_ROOT_PATH / 'pyproject.toml').read_text(encoding='utf-8')
+        for line in pyproject_toml_file.splitlines():
+            if line.startswith('version = '):
+                delim = '"' if '"' in line else "'"
+                sdk_version = line.split(delim)[1]
+                break
+        else:
+            raise RuntimeError('Unable to find version string.')
+
+        wheel_path = _SDK_ROOT_PATH / 'dist' / f'apify-{sdk_version}-py3-none-any.whl'
+
+        # Just to be sure.
+        assert wheel_path.exists()
+
+        return wheel_path
+
+
+@pytest.fixture(scope='session')
+def actor_base_source_files(sdk_wheel_path: Path) -> dict[str, str | bytes]:
+    """Create a dictionary of the base source files for a testing Actor.
+
+    It takes the files from `tests/integration/actor_source_base`, builds the Apify SDK wheel from
+    the current codebase, and adds them all together in a dictionary.
+    """
+    source_files: dict[str, str | bytes] = {}
+
+    # First read the actor_source_base files
+    actor_source_base_path = _SDK_ROOT_PATH / 'tests/integration/actor/actor_source_base'
+
+    for path in actor_source_base_path.glob('**/*'):
+        if not path.is_file():
+            continue
+        relative_path = str(path.relative_to(actor_source_base_path))
+        try:
+            source_files[relative_path] = path.read_text(encoding='utf-8')
+        except ValueError:
+            source_files[relative_path] = path.read_bytes()
+
+    sdk_wheel_file_name = sdk_wheel_path.name
+    source_files[sdk_wheel_file_name] = sdk_wheel_path.read_bytes()
+
+    source_files['requirements.txt'] = str(source_files['requirements.txt']).replace(
+        'APIFY_SDK_WHEEL_PLACEHOLDER', f'./{sdk_wheel_file_name}'
+    )
+
+    current_major_minor_python_version = '.'.join([str(x) for x in sys.version_info[:2]])
+    integration_tests_python_version = (
+        os.getenv('INTEGRATION_TESTS_PYTHON_VERSION') or current_major_minor_python_version
+    )
+    source_files['Dockerfile'] = str(source_files['Dockerfile']).replace(
+        'BASE_IMAGE_VERSION_PLACEHOLDER', integration_tests_python_version
+    )
+
+    return source_files
+
+
+class MakeActorFunction(Protocol):
+    """A type for the `make_actor` fixture."""
+
+    def __call__(
+        self,
+        label: str,
+        *,
+        main_func: Callable | None = None,
+        main_py: str | None = None,
+        source_files: Mapping[str, str | bytes] | None = None,
+        additional_requirements: list[str] | None = None,
+    ) -> Awaitable[ActorClientAsync]:
+        """Create a temporary Actor from the given main function or source files.
+
+        The Actor will be uploaded to the Apify Platform, built there, and after the test finishes, it will
+        be automatically deleted.
+
+        You have to pass exactly one of the `main_func`, `main_py` and `source_files` arguments.
+
+        Args:
+            label: The label which will be a part of the generated Actor name.
+            main_func: The main function of the Actor.
+            main_py: The `src/main.py` file of the Actor.
+            source_files: A dictionary of the source files of the Actor.
+            additional_requirements: A list of additional requirements to be added to the `requirements.txt`.
+
+        Returns:
+            A resource client for the created Actor.
+        """
+
+
+@pytest.fixture(scope='session')
+def make_actor(
+    actor_base_source_files: dict[str, str | bytes],
+    apify_token: str,
+) -> Iterator[MakeActorFunction]:
+    """Fixture for creating temporary Actors for testing purposes.
+
+    This returns a function that creates a temporary Actor from the given main function or source files. The Actor
+    will be uploaded to the Apify Platform, built there, and after the test finishes, it will be automatically deleted.
+    """
+    actors_for_cleanup: list[str] = []
+
+    async def _make_actor(
+        label: str,
+        *,
+        main_func: Callable | None = None,
+        main_py: str | None = None,
+        source_files: Mapping[str, str | bytes] | None = None,
+        additional_requirements: list[str] | None = None,
+    ) -> ActorClientAsync:
+        if not (main_func or main_py or source_files):
+            raise TypeError('One of `main_func`, `main_py` or `source_files` arguments must be specified')
+
+        if (main_func and main_py) or (main_func and source_files) or (main_py and source_files):
+            raise TypeError('Cannot specify more than one of `main_func`, `main_py` and `source_files` arguments')
+
+        client = ApifyClientAsync(token=apify_token, api_url=os.getenv(_API_URL_ENV_VAR))
+        actor_name = generate_unique_resource_name(label)
+
+        # Get the source of main_func and convert it into a reasonable main_py file.
+        if main_func:
+            func_source = textwrap.dedent(inspect.getsource(main_func))
+            func_source = func_source.replace(f'def {main_func.__name__}(', 'def main(')
+            main_py = '\n'.join(  # noqa: FLY002
+                [
+                    'import asyncio',
+                    '',
+                    'from apify import Actor',
+                    '',
+                    '',
+                    '',
+                    func_source,
+                ]
+            )
+
+        if main_py:
+            source_files = {'src/main.py': main_py}
+
+        assert source_files is not None
+
+        # Copy the source files dict from the fixture so that we're not overwriting it, and merge the passed
+        # argument in it.
+        actor_source_files = actor_base_source_files.copy()
+        actor_source_files.update(source_files)
+
+        if additional_requirements:
+            # Get the current requirements.txt content (as a string).
+            req_content = actor_source_files.get('requirements.txt', '')
+            if isinstance(req_content, bytes):
+                req_content = req_content.decode('utf-8')
+            # Append the additional requirements, each on a new line.
+            additional_reqs = '\n'.join(additional_requirements)
+            req_content = req_content.strip() + '\n' + additional_reqs + '\n'
+            actor_source_files['requirements.txt'] = req_content
+
+        # Reformat the source files in a format that the Apify API understands.
+        source_files_for_api = []
+        for file_name, file_contents in actor_source_files.items():
+            if isinstance(file_contents, str):
+                file_format = 'TEXT'
+                if file_name.endswith('.py'):
+                    file_contents = textwrap.dedent(file_contents).lstrip()  # noqa: PLW2901
+            else:
+                file_format = 'BASE64'
+                file_contents = base64.b64encode(file_contents).decode('utf-8')  # noqa: PLW2901
+
+            source_files_for_api.append(
+                {
+                    'name': file_name,
+                    'format': file_format,
+                    'content': file_contents,
+                }
+            )
+
+        print(f'Creating Actor {actor_name}...')
+        created_actor = await client.actors().create(
+            name=actor_name,
+            default_run_build='latest',
+            default_run_memory_mbytes=256,
+            default_run_timeout_secs=600,
+            versions=[
+                {
+                    'versionNumber': '0.0',
+                    'buildTag': 'latest',
+                    'sourceType': ActorSourceType.SOURCE_FILES,
+                    'sourceFiles': source_files_for_api,
+                }
+            ],
+        )
+
+        actor_client = client.actor(created_actor['id'])
+
+        print(f'Building Actor {actor_name}...')
+        build_result = await actor_client.build(version_number='0.0')
+        build_client = client.build(build_result['id'])
+        build_client_result = await build_client.wait_for_finish(wait_secs=600)
+
+        assert build_client_result is not None
+        assert build_client_result['status'] == ActorJobStatus.SUCCEEDED
+
+        # We only mark the client for cleanup if the build succeeded, so that if something goes wrong here,
+        # you have a chance to check the error.
+        actors_for_cleanup.append(created_actor['id'])
+
+        return actor_client
+
+    yield _make_actor
+
+    # Delete all the generated Actors.
+    for actor_id in actors_for_cleanup:
+        actor_client = ApifyClient(token=apify_token, api_url=os.getenv(_API_URL_ENV_VAR)).actor(actor_id)
+
+        if (actor := actor_client.get()) is not None:
+            actor_client.update(
+                pricing_infos=[
+                    *actor.get('pricingInfos', []),
+                    {
+                        'pricingModel': 'FREE',
+                    },
+                ]
+            )
+
+        actor_client.delete()
+
+
+class RunActorFunction(Protocol):
+    """A type for the `run_actor` fixture."""
+
+    def __call__(
+        self,
+        actor: ActorClientAsync,
+        *,
+        run_input: Any = None,
+        max_total_charge_usd: Decimal | None = None,
+    ) -> Coroutine[None, None, ActorRun]:
+        """Initiate an Actor run and wait for its completion.
+
+        Args:
+            actor: Actor async client, in testing context usually created by `make_actor` fixture.
+            run_input: Optional input for the Actor run.
+
+        Returns:
+            Actor run result.
+        """
+
+
+@pytest.fixture(scope='session')
+def run_actor(apify_client_async: ApifyClientAsync) -> RunActorFunction:
+    """Fixture for calling an Actor run and waiting for its completion.
+
+    This fixture returns a function that initiates an Actor run with optional run input, waits for its completion,
+    and retrieves the final result. It uses the `wait_for_finish` method with a timeout of 10 minutes.
+    """
+
+    async def _run_actor(
+        actor: ActorClientAsync,
+        *,
+        run_input: Any = None,
+        max_total_charge_usd: Decimal | None = None,
+    ) -> ActorRun:
+        call_result = await actor.call(
+            run_input=run_input,
+            max_total_charge_usd=max_total_charge_usd,
+        )
+
+        assert isinstance(call_result, dict), 'The result of ActorClientAsync.call() is not a dictionary.'
+        assert 'id' in call_result, 'The result of ActorClientAsync.call() does not contain an ID.'
+
+        run_client = apify_client_async.run(call_result['id'])
+        run_result = await run_client.wait_for_finish(wait_secs=600)
+
+        return ActorRun.model_validate(run_result)
+
+    return _run_actor