Merge branch 'master' of gitea.gorillamail.biz:cid/Web_Scrape
This commit is contained in:
1
main.py
1
main.py
@ -3,6 +3,7 @@ from bs4 import BeautifulSoup
|
|||||||
from urllib.parse import urlparse, urlunparse
|
from urllib.parse import urlparse, urlunparse
|
||||||
import pandas as pd
|
import pandas as pd
|
||||||
|
|
||||||
|
headers = {'User-Agent': 'myprogram/1.0'}
|
||||||
def scrape_headings(url):
|
def scrape_headings(url):
|
||||||
try:
|
try:
|
||||||
# Check if the URL has a scheme (http/https), and add one if missing
|
# Check if the URL has a scheme (http/https), and add one if missing
|
||||||
|
|||||||
Reference in New Issue
Block a user