Skip to content

Commit e3b0c1d

Browse files
authored
Merge pull request #69 from scrapy-plugins/fix-default-crawlera-headers
[MRG + 1] Fix default crawlera headers
2 parents e8554a5 + 42ec203 commit e3b0c1d

File tree

5 files changed

+13 additions, -6 deletions (lines changed)

5 files changed

+13 additions, -6 deletions (lines changed)

.bumpversion.cfg

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,5 @@
11
[bumpversion]
2-
current_version = 1.4.0
2+
current_version = 1.5.0
33
commit = True
44
tag = True
55
tag_name = v{new_version}

scrapy_crawlera/__init__.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
11
from .middleware import CrawleraMiddleware
22

33

4-
__version__ = '1.4.0'
4+
__version__ = '1.5.0'

scrapy_crawlera/middleware.py

Lines changed: 8 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -231,7 +231,14 @@ def _set_crawlera_default_headers(self, request):
231 231
header.decode('utf-8').lower() for header in request.headers
232 232
]
233 233
if all(h.lower() in lower_case_headers for h in self.conflicting_headers):
234-
logging.warn(
234+
# Send a general warning once, and specific urls if LOG_LEVEL = DEBUG
235+
warnings.warn(
236+
'The headers %s are conflicting on some of your requests. '
237+
'Please check https://doc.scrapinghub.com/crawlera.html '
238+
'for more information. You can set LOG_LEVEL=DEBUG to see the urls with problems'
239+
% str(self.conflicting_headers)
240+
)
241+
logging.debug(
235 242
'The headers %s are conflicting on request %s. X-Crawlera-UA '
236 243
'will be ignored. Please check https://doc.scrapinghub.com/cr'
237 244
'awlera.html for more information'

setup.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -6,7 +6,7 @@
66

77
setup(
88
name='scrapy-crawlera',
9-
version='1.4.0',
9+
version='1.5.0',
1010
license='BSD',
1111
description='Crawlera middleware for Scrapy',
1212
long_description=readme,

tests/test_crawlera.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -434,7 +434,7 @@ def test_crawlera_default_headers_conflicting_headers(self, mock_logger):
434434
assert mw.process_request(req, spider) is None
435435
self.assertEqual(req.headers['X-Crawlera-UA'], b'desktop')
436436
self.assertEqual(req.headers['X-Crawlera-Profile'], b'desktop')
437-
mock_logger.warn.assert_called_with(
437+
mock_logger.debug.assert_called_with(
438438
"The headers ('X-Crawlera-Profile', 'X-Crawlera-UA') are conflictin"
439439
"g on request http://www.scrapytest.org/other. X-Crawlera-UA will b"
440440
"e ignored. Please check https://doc.scrapinghub.com/crawlera.html "
@@ -447,7 +447,7 @@ def test_crawlera_default_headers_conflicting_headers(self, mock_logger):
447447
assert mw.process_request(req, spider) is None
448448
self.assertEqual(req.headers['X-Crawlera-UA'], b'desktop')
449449
self.assertEqual(req.headers['X-Crawlera-Profile'], b'desktop')
450-
mock_logger.warn.assert_called_with(
450+
mock_logger.debug.assert_called_with(
451451
"The headers ('X-Crawlera-Profile', 'X-Crawlera-UA') are conflictin"
452452
"g on request http://www.scrapytest.org/other. X-Crawlera-UA will b"
453453
"e ignored. Please check https://doc.scrapinghub.com/crawlera.html "

0 commit comments

Comments (0)