Merge pull request #1723 from Tanya-1109/master

1e9abhi1e10 · web-flow · commit bd5b280286fc · 2023-06-09T22:17:01.000+05:30
Added link Scrapper
diff --git a/Readme.md b/Readme.md
@@ -0,0 +1,17 @@
+# LINK SCRAPER
+
+
+- Scrapes the absolute HTTP(S) links from a web page and prints them.
+
+
+## Setup instructions
+
+Any PC with Python 3 and the `requests` and `beautifulsoup4` packages installed (`pip install requests beautifulsoup4`) can run this code.
+
+
+## Output
+![Example output](image.png)
+
+## Author(s)
+
+Tanya Mohanka
diff --git a/script.py b/script.py
@@ -0,0 +1,15 @@
+import requests
+from bs4 import BeautifulSoup
+
+def scrape_links(url, timeout=10):
+    """Fetch ``url`` and print every absolute HTTP(S) link found on the page.
+
+    Args:
+        url: Address of the page to scrape.
+        timeout: Seconds to wait for the server before giving up.
+
+    Returns:
+        The list of printed links, in document order.
+
+    Raises:
+        requests.RequestException: If the request fails, times out, or the
+            server answers with a 4xx/5xx status.
+    """
+    # Without a timeout, requests can block forever on an unresponsive host.
+    response = requests.get(url, timeout=timeout)
+    # Fail loudly on an HTTP error instead of scraping the error page.
+    response.raise_for_status()
+    soup = BeautifulSoup(response.text, 'html.parser')
+    links = []
+    for anchor in soup.find_all('a'):
+        href = anchor.get('href')
+        # Match the full scheme (case-insensitively) so that values such as
+        # "httpfoo:..." are rejected and "HTTPS://..." is accepted.
+        if href and href.lower().startswith(('http://', 'https://')):
+            print(href)
+            links.append(href)
+    return links
+
+# Example usage: runs only when the file is executed as a script, so that
+# importing this module does not trigger a network request.
+if __name__ == '__main__':
+    # Replace with the URL of the website you want to scrape
+    url = 'https://www.linkedin.com/feed/'
+    scrape_links(url)