implemented download_image in utils

Linusp · Linusp · commit f08edb4b639a · 2020-07-22T09:49:59.000+08:00
diff --git a/inoreader/utils.py b/inoreader/utils.py
@@ -1,8 +1,11 @@
 # coding: utf-8
 from __future__ import print_function, unicode_literals
 
+import os
 import re
+import shutil
 
+import requests
 from lxml import html
 
 
@@ -35,3 +38,28 @@ def extract_text(html_content):
         link.text = '[%s](%s)' % (text, url)
 
     return content.text_content().replace('\xa0', '').strip()
+
+
+def download_image(url, path, filename, proxies=None):
+    response = requests.get(url, stream=True, proxies=proxies)
+    if response.status_code not in (200, 201):
+        return None
+
+    content_type = response.headers.get('Content-Type', '')
+    if not content_type or not content_type.startswith('image/'):
+        return None
+
+    content_length = int(response.headers.get('Content-Length') or '0')
+    if content_length <= 0:
+        return None
+
+    suffix = content_type.replace('image/', '')
+    if suffix == 'svg+xml':
+        suffix = 'svg'
+
+    image_filename = f'{filename}.{suffix}'
+    with open(os.path.join(path, image_filename), 'wb') as f:
+        response.raw.decode_content = True
+        shutil.copyfileobj(response.raw, f)
+
+    return image_filename