kaustumbh7 · August 31, 2021 00:13 · jamtayyab · Aug 31, 2021
diff --git a/scraper.py b/scraper.py
 # Scrape the paragraphs of one BBC Sport article, print them, and save them
 # to `scraped_text.txt`.

 # import libraries
 import sys
 from urllib.request import urlopen
 from bs4 import BeautifulSoup

 # specify the url
 url = "https://www.bbc.com/sport/football/46897172"

 # Connect to the website and read the raw html into the variable `page`.
 # The `with` block closes the HTTP response once the body has been read.
 # OSError covers urllib's URLError/HTTPError (both subclass it) and socket
 # failures; ValueError is raised for a malformed URL.
 try:
     with urlopen(url) as response:
         page = response.read()
 except (OSError, ValueError) as err:
     # Nothing to parse without a response: stop here instead of falling
     # through to a NameError on `page`.
     sys.exit(f"Error opening the URL: {err}")

 # parse the html using beautiful soup and store in variable `soup`
 soup = BeautifulSoup(page, 'html.parser')

 # Take out the <div> that holds the story body
 content = soup.find('div', {"class": "story-body sp-story-body gel-body-copy"})
 if content is None:
     # find() returns None when no element matches (e.g. the page layout
     # changed); report it instead of crashing on an attribute lookup.
     sys.exit("Could not find the article body in the page")

 # Join the text of every <p>, each preceded by a single space (same output
 # as the original accumulate-in-a-loop form).
 article = ''.join(' ' + paragraph.text for paragraph in content.find_all('p'))
 print(article)

 # Saving the scraped text; an explicit encoding keeps non-ASCII characters
 # from failing on platforms whose default encoding is not UTF-8.
 with open('scraped_text.txt', 'w', encoding='utf-8') as file:
     file.write(article)
	# Scrape the paragraphs of one BBC Sport article, print them, and save them
	# to `scraped_text.txt`.

	# import libraries
	import sys
	from urllib.request import urlopen
	from bs4 import BeautifulSoup

	# specify the url
	url = "https://www.bbc.com/sport/football/46897172"

	# Connect to the website and read the raw html into the variable `page`.
	# The `with` block closes the HTTP response once the body has been read.
	# OSError covers urllib's URLError/HTTPError (both subclass it) and socket
	# failures; ValueError is raised for a malformed URL.
	try:
	    with urlopen(url) as response:
	        page = response.read()
	except (OSError, ValueError) as err:
	    # Nothing to parse without a response: stop here instead of falling
	    # through to a NameError on `page`.
	    sys.exit(f"Error opening the URL: {err}")

	# parse the html using beautiful soup and store in variable `soup`
	soup = BeautifulSoup(page, 'html.parser')

	# Take out the <div> that holds the story body
	content = soup.find('div', {"class": "story-body sp-story-body gel-body-copy"})
	if content is None:
	    # find() returns None when no element matches (e.g. the page layout
	    # changed); report it instead of crashing on an attribute lookup.
	    sys.exit("Could not find the article body in the page")

	# Join the text of every <p>, each preceded by a single space (same output
	# as the original accumulate-in-a-loop form).
	article = ''.join(' ' + paragraph.text for paragraph in content.find_all('p'))
	print(article)

	# Saving the scraped text; an explicit encoding keeps non-ASCII characters
	# from failing on platforms whose default encoding is not UTF-8.
	with open('scraped_text.txt', 'w', encoding='utf-8') as file:
	    file.write(article)