77BASE_URL = "https://www.bing.com/images/search?"
88
99
10- def gen_query_url (keywords , filters , extra_query_params = '' ):
10+ def gen_query_url (keywords , filters , extra_query_params = '' ):
1111 keywords_str = "&q=" + quote (keywords )
1212 query_url = BASE_URL + keywords_str
1313 if len (filters ) > 0 :
@@ -44,7 +44,7 @@ def image_url_from_webpage(driver, max_number=10000):
4444 return image_urls
4545
4646
47- def crawl_image_urls (keywords , filters , max_number = 10000 , proxy = None , proxy_type = "http" , extra_query_params = '' ):
47+ def crawl_image_urls (keywords , filters , max_number = 10000 , proxy = None , proxy_type = "http" , extra_query_params = '' ):
4848 chrome_path = shutil .which ("chromedriver" )
4949 chrome_path = "./bin/chromedriver" if chrome_path is None else chrome_path
5050 chrome_options = webdriver .ChromeOptions ()
@@ -53,7 +53,7 @@ def crawl_image_urls(keywords, filters, max_number=10000, proxy=None, proxy_type
5353 "--proxy-server={}://{}" .format (proxy_type , proxy ))
5454 driver = webdriver .Chrome (chrome_path , chrome_options = chrome_options )
5555
56- query_url = gen_query_url (keywords , filters , extra_query_params )
56+ query_url = gen_query_url (keywords , filters , extra_query_params = extra_query_params )
5757 driver .set_window_size (1920 , 1080 )
5858 driver .get (query_url )
5959 image_urls = image_url_from_webpage (driver , max_number )
@@ -72,6 +72,6 @@ def crawl_image_urls(keywords, filters, max_number=10000, proxy=None, proxy_type
7272
7373if __name__ == '__main__' :
7474 images = crawl_image_urls (
75- "mbot png" , "+filterui:aspect-square" , max_number = 10 )
75+ "cat png" , "+filterui:aspect-square" , max_number = 10 )
7676 for i in images :
7777 print (i + "\n " )
0 commit comments