Advertisement

crawler1.py

Jackspade9624

May 30th, 2025 (edited)

16

0

Never

Add comment

Not a member of Pastebin yet? Sign Up, it unlocks many cool features!

text 1.17 KB | None | 0 0

raw download clone embed print report

#!/usr/bin/env python3
import requests
from bs4 import BeautifulSoup
def crawl_page(url, timeout=10):
    """Fetch a webpage and return the anchor tags that carry an ``href``.

    Args:
        url: Address of the page to download.
        timeout: Seconds to wait for the server before giving up. Passed
            straight to ``requests.get``; without it a stalled server
            would block the caller forever.

    Returns:
        The result of ``soup.find_all('a', href=True)`` for the downloaded
        page, or an empty list when the request fails (connection error,
        timeout, or a bad HTTP status).
    """
    try:
        response = requests.get(url, timeout=timeout)
        response.raise_for_status()  # Raise an exception for bad status codes
    except requests.exceptions.RequestException as e:
        # Best-effort crawl: report the failure and hand back "no links"
        # instead of propagating, so the interactive loop keeps running.
        print(f"Error fetching {url}: {e}")
        return []
    else:
        soup = BeautifulSoup(response.text, 'html.parser')
        return soup.find_all('a', href=True)
def main():
    """Repeatedly prompt for a URL, crawl it, and print every link found.

    The loop ends when the user types ``exit`` (any letter case, surrounding
    whitespace ignored) or when standard input is closed. Input that does
    not start with ``http://`` or ``https://`` is rejected and the prompt
    is shown again.
    """
    while True:
        try:
            url = input("Enter the URL to crawl (or type 'exit' to quit): ")
        except EOFError:
            # stdin was closed (Ctrl-D or piped input ran out): leave
            # quietly rather than crash with a traceback.
            break

        # Stray whitespace from typing or pasting should neither defeat
        # the 'exit' command nor the scheme check below.
        url = url.strip()

        if url.lower() == 'exit':
            break

        if not url.startswith(("http://", "https://")):
            print("Please enter a valid URL (e.g., http://example.com)")
            continue

        print(f"Crawling: {url}")
        links = crawl_page(url)

        if links:
            for link in links:
                print(link['href'])
        else:
            # crawl_page returns an empty list both for pages without
            # links and for failed requests, so the two cannot be told
            # apart at this point.
            print("No links found or error occurred.")
# Start the interactive prompt only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()

Advertisement

Add Comment

Please, Sign In to add comment

Advertisement

Public Pastes

Netflix Premium UHD Hits
JavaScript | 2 sec ago | 0.08 KB
Make $1200 in 15 minutes
JavaScript | 6 sec ago | 0.08 KB
✅ Account Leaks
JavaScript | 9 sec ago | 0.08 KB
✅ Account Leaks
JavaScript | 13 sec ago | 0.08 KB
FREE BTC GUIDE
JavaScript | 18 sec ago | 0.08 KB
GMAIL Logs (2FA disabled)
JavaScript | 21 sec ago | 0.08 KB
FREE 8TC GUIDE✅ O
JavaScript | 22 sec ago | 0.03 KB
GMAIL Logs (2FA disabled)
JavaScript | 25 sec ago | 0.08 KB

Advertisement