(PYTHON) How to convert web-scrapping script into Python class? Example: from bs4 import BeautifulSoup import requests def openHtmlFile(htmlfile): f = open(htmlfile, 'https://en.wikipedia.org/wiki/List_of_countries_by_carbon_dioxide_emissions_per_ca pita') contents = f.read() return BeautifulSoup(contents, 'html.parser') scrape_site = requests.get('https://en.wikipedia.org/wiki/List_of_countries_by_carbon_dioxide_emi ssions_per_capita') soup = BeautifulSoup(scrape_site.text, 'html.parser') table = soup.find_all('table',{'class':'wikitable sortable jquery-tablesorter'}) for values in table: country = soup.find_all(soup,'td') year = soup.find_all(soup, 'th') column_country = [td.text for td in soup.find_all('td')] coulumn_year = [th.text for th in soup.find_all('th')] seperate_year = soup.find_all('th')[2:5] country = soup.find_all(soup,'td') #show 1980 column year_1980 = soup.find_all('th')[2] #show 2018 column year_2018 = soup.find_all('th')[5] print(country) print(year_1980) print(year_2018) No hand written and fast answer with explanation
(PYTHON) How do I convert a web-scraping script into a Python class? Example:
from bs4 import BeautifulSoup
import requests
def openHtmlFile(htmlfile):
    """Parse a local HTML file into a BeautifulSoup tree.

    Args:
        htmlfile: Path of the HTML file to read.

    Returns:
        A ``BeautifulSoup`` object built with the ``html.parser`` backend.

    Raises:
        OSError: If the file cannot be opened or read.
    """
    # The second positional argument of open() is the file *mode*. The
    # original passed the Wikipedia URL there, which open() rejects as an
    # invalid mode. Read raw bytes instead so the parser can work out the
    # document's encoding itself, and let ``with`` close the handle.
    with open(htmlfile, 'rb') as f:
        contents = f.read()
    return BeautifulSoup(contents, 'html.parser')
# Download the Wikipedia article. The URL is written as one logical string
# (adjacent literals are concatenated) so no stray whitespace ends up in it.
scrape_site = requests.get(
    'https://en.wikipedia.org/wiki/'
    'List_of_countries_by_carbon_dioxide_emissions_per_capita',
    timeout=30,  # do not hang forever on an unresponsive server
)
# Stop on an HTTP error instead of silently parsing an error page.
scrape_site.raise_for_status()
soup = BeautifulSoup(scrape_site.text, 'html.parser')

# Match on the 'wikitable' class only. 'jquery-tablesorter' is added by
# JavaScript in the browser, so it is not present in the HTML that requests
# downloads, and requiring it made this search return nothing.
table = soup.find_all('table', {'class': 'wikitable'})

for values in table:
    # Search inside the current table rather than the whole document, so each
    # iteration actually uses the loop variable.
    year = values.find_all('th')
    if len(year) < 6:
        # Index 5 is read below; skip tables with too few header cells.
        continue

    # find_all takes the tag name as its first argument; the original passed
    # the soup object there.
    country = values.find_all('td')

    # Plain-text versions of the cells. The misspelled names are kept as they
    # are in case code elsewhere in the file refers to them.
    column_country = [td.text for td in country]
    coulumn_year = [th.text for th in year]
    seperate_year = year[2:5]

    # show 1980 column
    # NOTE(review): assumes header cell 2 is the 1980 column; confirm against
    # the page's current layout.
    year_1980 = year[2]
    # show 2018 column
    # NOTE(review): assumes header cell 5 is the 2018 column; confirm against
    # the page's current layout.
    year_2018 = year[5]

    print(country)
    print(year_1980)
    print(year_2018)
Please give a typed (not handwritten), prompt answer with an explanation.
Step by step
Solved in 3 steps with 2 images