
Commit dde4b46: Without debug

1 parent 134e8be commit dde4b46

3 files changed: +1, -63 lines


src/apify/storage_clients/_apify/_request_queue_client.py

Lines changed: 0 additions & 35 deletions
@@ -26,7 +26,6 @@
 
 logger = getLogger(__name__)
 
-COUNTER = iter(range(10000))
 
 class ApifyRequestQueueClient(RequestQueueClient):
     """An Apify platform implementation of the request queue client."""
@@ -295,25 +294,18 @@ async def fetch_next_request(self) -> Request | None:
         Returns:
             The request or `None` if there are no more pending requests.
         """
-        call_time = next(COUNTER)
         # Ensure the queue head has requests if available. Fetching the head with lock to prevent race conditions.
-        logger.debug(f'Before _fetch_lock, {call_time}')
         async with self._fetch_lock:
-            logger.debug(f'Fetching, {call_time}')
             await self._ensure_head_is_non_empty()
 
             # If queue head is empty after ensuring, there are no requests
             if not self._queue_head:
-                logger.debug(f'Empty, {call_time}')
                 return None
 
             # Get the next request ID from the queue head
             next_request_id = self._queue_head.popleft()
-            logger.debug(f'New request, {call_time}')
 
-            logger.debug(f'Before hydrate, {call_time}')
             request = await self._get_or_hydrate_request(next_request_id)
-            logger.debug(f'After hydrate, {call_time}')
 
             # Handle potential inconsistency where request might not be in the main table yet
             if request is None:
@@ -331,16 +323,6 @@ async def fetch_next_request(self) -> Request | None:
                 )
                 return None
 
-            # Use get request to ensure we have the full request object.
-            #request = await self.get_request(request.id) This seems redundant
-            if request is None:
-                logger.debug(
-                    'Request fetched from the beginning of queue was not found in the RQ',
-                    extra={'nextRequestId': next_request_id},
-                )
-                return None
-
-            logger.debug(f'{request.retry_count=}, {call_time}')
             return request
 
     @override
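For context, the surviving control flow refills the cached head and pops from it under a single `asyncio.Lock`, so two consumers cannot race between the emptiness check and the `popleft()`. A toy sketch of that pattern, with simplified stand-in names (not the real client):

    import asyncio
    from collections import deque

    class MiniQueueClient:
        """Toy model of the lock-protected fetch pattern (illustrative only)."""

        def __init__(self) -> None:
            self._queue_head: deque[str] = deque()
            self._fetch_lock = asyncio.Lock()

        async def _ensure_head_is_non_empty(self) -> None:
            # Stand-in for the real API-backed refill.
            await asyncio.sleep(0)
            if not self._queue_head:
                self._queue_head.extend(['req-1', 'req-2'])

        async def fetch_next_request(self) -> str | None:
            # Refill and pop under one lock: no consumer can observe the head
            # between another consumer's emptiness check and its popleft().
            async with self._fetch_lock:
                await self._ensure_head_is_non_empty()
                if not self._queue_head:
                    return None
                return self._queue_head.popleft()

    async def main() -> None:
        client = MiniQueueClient()
        results = await asyncio.gather(
            client.fetch_next_request(), client.fetch_next_request()
        )
        print(results)  # ['req-1', 'req-2']: each consumer gets a distinct id

    asyncio.run(main())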
@@ -403,16 +385,13 @@ async def reclaim_request(
         """
         # Check if the request was marked as handled and clear it. When reclaiming,
         # we want to put the request back for processing.
-        call_time = next(COUNTER)
         if request.was_already_handled:
             request.handled_at = None
 
         async with self._fetch_lock:
             try:
                 # Update the request in the API.
-                logger.debug(f'Before _update_request reclaiming, {call_time}')
                 processed_request = await self._update_request(request, forefront=forefront)
-                logger.debug(f'After _update_request reclaiming, {call_time}')
                 processed_request.unique_key = request.unique_key
 
                 # If the request was previously handled, decrement our handled count since
@@ -435,9 +414,7 @@
 
                 # Try to release the lock on the request
                 try:
-                    logger.debug(f'Before _delete_request_lock reclaiming, {call_time}')
                     await self._delete_request_lock(request.id, forefront=forefront)
-                    logger.debug(f'After _delete_request_lock reclaiming, {call_time}')
                 except Exception as err:
                     logger.debug(f'Failed to delete request lock for request {request.id}', exc_info=err)
             except Exception as exc:
@@ -453,13 +430,8 @@ async def is_empty(self) -> bool:
         Returns:
             True if the queue is empty, False otherwise.
         """
-        call_time = next(COUNTER)
-        logger.debug(f'Before _list_head is_empty, {call_time}')
         async with self._fetch_lock:
-            logger.debug(f'During _list_head is_empty, {call_time}')
             head = await self._list_head(limit=1, lock_time=None)
-            logger.debug(f'After _list_head is_empty, {call_time}')
-            logger.debug(f'Finish _list_head is_empty, {call_time}')
             return len(head.items) == 0 and not self._queue_has_locked_requests
 
     async def _ensure_head_is_non_empty(self) -> None:
@@ -571,10 +543,7 @@ async def _list_head(
             A collection of requests from the beginning of the queue.
         """
         # Return from cache if available and we're not checking for new forefront requests
-        call_time = next(COUNTER)
         if self._queue_head and not self._should_check_for_forefront_requests:
-            logger.debug(f'Using cached queue head with {len(self._queue_head)} requests, {call_time}')
-
             # Create a list of requests from the cached queue head
             items = []
             for request_id in list(self._queue_head)[:limit]:
@@ -592,7 +561,6 @@
             queue_has_locked_requests=self._queue_has_locked_requests,
             lock_time=lock_time,
         )
-        logger.debug(f'Updating cached queue head with {len(self._queue_head)} requests, {call_time}')
         leftover_buffer = list[str]()
         if self._should_check_for_forefront_requests:
             leftover_buffer = list(self._queue_head)
@@ -636,14 +604,11 @@
                 ),
                 hydrated_request=request,
             )
-            logger.debug(f'Adding to head, {call_time}')
             self._queue_head.append(request.id)
-        logger.debug(f'Cached queue head with {len(self._queue_head)} requests, {call_time}')
 
         for leftover_request_id in leftover_buffer:
             # After adding new requests to the forefront, any existing leftover locked request is kept in the end.
             self._queue_head.append(leftover_request_id)
-        logger.debug(f'Cached queue head with {len(self._queue_head)} requests, {call_time}')
         return RequestQueueHead.model_validate(response)
 
     async def _prolong_request_lock(
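The `leftover_buffer` handling retained above reorders the cached head: when a forefront check forces a refresh, freshly listed requests go to the front and previously cached, still-locked entries are re-appended at the end. A small self-contained sketch of that reordering, with hypothetical request ids:

    from collections import deque

    # Cached head before a forefront check: two requests already locked by us.
    queue_head = deque(['old-1', 'old-2'])

    # When forefront requests must be re-checked, stash the current head...
    leftover_buffer = list(queue_head)
    queue_head.clear()

    # ...let freshly listed head items (forefront first) fill the head...
    for request_id in ['fore-1', 'fore-2']:
        queue_head.append(request_id)

    # ...and re-append the leftovers so they keep their place at the end.
    for leftover_request_id in leftover_buffer:
        queue_head.append(leftover_request_id)

    print(list(queue_head))  # ['fore-1', 'fore-2', 'old-1', 'old-2']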

tests/integration/test_actor_request_queue.py

Lines changed: 0 additions & 22 deletions
@@ -113,25 +113,3 @@ async def test_request_queue_is_finished(
         assert await request_queue.is_finished()
     finally:
         await request_queue.drop()
-
-
-async def test_same_request_fetched_twice(
-    apify_client_async: ApifyClientAsync,
-    monkeypatch: pytest.MonkeyPatch):
-    """Test that the same request can be fetched twice from the request queue."""
-    monkeypatch.setenv(ApifyEnvVars.TOKEN, apify_client_async.token)
-
-    request_queue_name = generate_unique_resource_name('request_queue')
-    async with Actor:
-        try:
-            request_queue = await Actor.open_request_queue(name='same-request-fetch', force_cloud=request_queue_name)
-
-            request = Request.from_url('http://example.com')
-            await request_queue.add_request(request)
-
-            fetched_request_1 = await request_queue.fetch_next_request()
-            assert fetched_request_1 is not None
-            assert fetched_request_1.url == 'http://example.com'
-            await request_queue.reclaim_request(fetched_request_1)
-        finally:
-            await request_queue.drop()
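For reference, the fetch-then-reclaim flow the deleted test exercised looks roughly like this at the SDK level (a minimal sketch following the deleted test's own calls; it assumes a configured Apify token in the environment):

    import asyncio

    from apify import Actor, Request

    async def main() -> None:
        async with Actor:
            request_queue = await Actor.open_request_queue()
            await request_queue.add_request(Request.from_url('http://example.com'))

            # The first fetch locks the request for this client.
            fetched = await request_queue.fetch_next_request()
            assert fetched is not None

            # Reclaiming releases the lock and puts the request back in the
            # queue, so a subsequent fetch can return the same request again.
            await request_queue.reclaim_request(fetched)

    asyncio.run(main())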

tests/integration/test_crawlers_with_storages.py

Lines changed: 1 addition & 6 deletions
@@ -2,8 +2,6 @@
 
 from typing import TYPE_CHECKING
 
-import pytest
-
 if TYPE_CHECKING:
     from .conftest import MakeActorFunction, RunActorFunction
 
@@ -78,23 +76,20 @@ async def default_handler(context: ParselCrawlingContext) -> None:
     assert run_result.status == 'SUCCEEDED'
 
 
-@pytest.mark.parametrize('_', range(10))
-async def test_actor_on_platform_max_request_retries(_,
+async def test_actor_on_platform_max_request_retries(
     make_actor: MakeActorFunction,
     run_actor: RunActorFunction,
 ) -> None:
     """Test that the actor respects max_request_retries."""
 
     async def main() -> None:
         """The crawler entry point."""
-        import logging
 
         from crawlee.crawlers import BasicCrawlingContext, ParselCrawler, ParselCrawlingContext
 
         from apify import Actor
 
         async with Actor:
-            logging.getLogger('apify.storage_clients._apify._request_queue_client').setLevel(logging.DEBUG)
             max_retries = 3
             crawler = ParselCrawler(max_request_retries=max_retries)
             failed_counter = 0
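The dropped `@pytest.mark.parametrize('_', range(10))` decorator is a common idiom for rerunning a single test body many times while chasing a flaky failure; a minimal standalone sketch:

    import pytest

    # The throwaway '_' parameter exists only to drive ten repetitions of
    # the same test body; each repetition shows up as a separate test case.
    @pytest.mark.parametrize('_', range(10))
    def test_repeated(_: int) -> None:
        assert 1 + 1 == 2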
