Replace regex-based link/email crawler with BeautifulSoup link lister

Brivno1234 · web-flow · commit 89a2b66f7de6 · 2025-05-12T14:52:47.000+03:00
diff --git a/scripts/08_basic_email_web_crawler.py b/scripts/08_basic_email_web_crawler.py
@@ -1,21 +1,17 @@
-import requests
-import re
-
-# get url
-url = input('Enter a URL (include `http://`): ')
-
-# connect to the url
-website = requests.get(url)
-
-# read html
-html = website.text
-
-# use re.findall to grab all the links
-links = re.findall('"((http|ftp)s?://.*?)"', html)
-emails = re.findall('([\w\.,]+@[\w\.,]+\.\w+)', html)
-
-
-# print the number of links in the list
-print("\nFound {} links".format(len(links)))
-for email in emails:
-    print(email)
+from bs4 import BeautifulSoup 
+import requests
+
+
+
+
+url = input('Enter a URL (include `http://`): ')
+
+# A timeout keeps the script from hanging forever on an unresponsive host.
+response = requests.get(url, timeout=10)
+html = response.text
+soup = BeautifulSoup(html, "html.parser")
+print(html)
+
+links = list(soup.find_all("a", href=True))  # `links`, not `list`: don't shadow the builtin
+for link in links:
+    print("leited kink: ", link)