Merge branch 'master' of gitea.gorillamail.biz:cid/Web_Scrape

This commit is contained in:
2023-12-30 23:15:47 -05:00

View File

@@ -3,6 +3,7 @@ from bs4 import BeautifulSoup
from urllib.parse import urlparse, urlunparse
import pandas as pd
headers = {'User-Agent': 'myprogram/1.0'}
def scrape_headings(url):
try:
# Check if the URL has a scheme (http/https), and add one if missing